In [1]:
import pandas as pd
# Read the survey table from the CSV file (path is relative to the
# notebook's working directory) into a DataFrame.
surveys_df = pd.read_csv(
    filepath_or_buffer="data/surveys.csv",
)
In [2]:
# Display the Python type of the object returned by pd.read_csv.
type(surveys_df)
Out[2]:
In [3]:
# Show the dtype of a single column (here: record_id).
surveys_df.record_id.dtype
Out[3]:
In [4]:
# Display the dtype of every column in the frame at once.
surveys_df.dtypes
Out[4]:
In [5]:
# Cast record_id to float64 and store the converted column back on the
# same frame; the final expression displays the resulting dtype.
surveys_df['record_id'] = surveys_df.record_id.astype('float64')
surveys_df.record_id.dtype
Out[5]:
In [6]:
# Mean of the weight column as loaded (no filling applied to surveys_df).
surveys_df.weight.mean()
Out[6]:
In [7]:
# Number of rows whose weight is missing: count the True entries of the
# null mask rather than materialising the filtered frame.
print(int(surveys_df['weight'].isnull().sum()))
# Number of rows whose weight is strictly positive (missing values
# compare as False and are therefore not counted).
print(int((surveys_df['weight'] > 0).sum()))
In [8]:
# Build a separate frame whose missing weights are replaced by 0;
# surveys_df itself is left untouched because assign returns a new frame.
df1 = surveys_df.assign(weight=surveys_df['weight'].fillna(0))
In [9]:
# Mean weight of df1 as it stands after the preceding fill step.
df1.weight.mean()
Out[9]:
In [10]:
# Replace df1's weight column with the surveys_df weights, filling the
# missing entries with the mean of the surveys_df weight column.
# Both the values and the mean are taken from surveys_df, not from df1.
df1['weight'] = surveys_df.weight.fillna(
    value=surveys_df.weight.mean()
)