In [1]:
import pandas as pd
%matplotlib inline
In [2]:
# Load the data-collection sheet into the working frame `df`.
df = pd.read_csv(filepath_or_buffer="data/Data_Collection_Sheet.csv")
In [4]:
# Histogram of the "height (inches)" column, grouped into 5 bins.
df.loc[:, "height (inches)"].hist(bins=5)
Out[4]:
In [7]:
# Show the frame's column labels; later cells index columns by these exact
# strings (e.g. 'siblings (not including you)').
df.columns
Out[7]:
In [8]:
# Histogram of the sibling-count column using the default binning.
df.loc[:, "siblings (not including you)"].hist()
Out[8]:
In [9]:
# Mean of the sibling-count column.
df.loc[:, "siblings (not including you)"].mean()
Out[9]:
In [11]:
# Rows whose "height (inches)" value is strictly greater than 75
# (presumably a check on the upper tail of the histogram -- confirm intent).
df.loc[df["height (inches)"].gt(75)]
Out[11]:
In [13]:
# Rows whose "height (inches)" value is strictly less than 59
# (presumably a check on the lower tail of the histogram -- confirm intent).
df.loc[df["height (inches)"].lt(59)]
Out[13]:
In [14]:
# Load the height/weight workbook.
# NOTE: this rebinds `df`, so from here on `df` no longer refers to the CSV
# loaded earlier; re-running an earlier cell after this one will operate on
# this frame instead.
df = pd.read_excel(io="data/height_weight.xlsx")
In [18]:
# Scatter plot with 'height' on the x-axis and 'weight' on the y-axis.
df.plot.scatter(x="height", y="weight")
Out[18]:
In [19]:
# Pairwise correlation of the two columns shown in the scatter plot above.
# Selecting the columns explicitly keeps the result independent of
# DataFrame.corr's `numeric_only` default, which changed in pandas 2.0: with
# the new default, a bare df.corr() raises if the frame holds any
# non-numeric column.
df[["height", "weight"]].corr()
Out[19]:
In [ ]: