diff --git a/chapter_preliminaries/pandas.md b/chapter_preliminaries/pandas.md index 49e006295..8cc879e71 100644 --- a/chapter_preliminaries/pandas.md +++ b/chapter_preliminaries/pandas.md @@ -37,7 +37,7 @@ with open(data_file, 'w') as f: # !pip install pandas import pandas as pd -data = pd.read_csv(data_file) +data = pd.read_csv(data_file, na_values=['NA']) print(data) ``` @@ -55,7 +55,7 @@ print(data) ```{.python .input} #@tab all inputs, outputs = data.iloc[:, 0:2], data.iloc[:, 2] -inputs = inputs.fillna(inputs.mean()) +inputs = inputs.fillna(inputs.select_dtypes(include=['number']).mean()) print(inputs) ``` diff --git a/chapter_preliminaries/pandas_origin.md b/chapter_preliminaries/pandas_origin.md index 1e6cdb4c8..33d425cc7 100644 --- a/chapter_preliminaries/pandas_origin.md +++ b/chapter_preliminaries/pandas_origin.md @@ -45,7 +45,7 @@ This dataset has four rows and three columns, where each row describes the numbe # !pip install pandas import pandas as pd -data = pd.read_csv(data_file) +data = pd.read_csv(data_file, na_values=['NA']) print(data) ``` @@ -64,7 +64,7 @@ we [**replace the "NaN" entries with the mean value of the same column.**] ```{.python .input} #@tab all inputs, outputs = data.iloc[:, 0:2], data.iloc[:, 2] -inputs = inputs.fillna(inputs.mean()) +inputs = inputs.fillna(inputs.select_dtypes(include=['number']).mean()) print(inputs) ``` @@ -132,3 +132,4 @@ Create a raw dataset with more rows and columns. :begin_tab:`tensorflow` [Discussions](https://discuss.d2l.ai/t/195) :end_tab: +