In [1]:
import pandas as pd
%matplotlib inline
import matplotlib.pyplot as plt
import statsmodels.formula.api as smf
In [4]:
# Load the Hanford dataset from the CSV file into a DataFrame.
hanford_csv = "data/hanford.csv"
df = pd.read_csv(hanford_csv)
In [5]:
# Display the loaded DataFrame as this cell's output.
df
Out[5]:
In [6]:
# Arithmetic mean of the Exposure column.
df.loc[:, 'Exposure'].mean()
Out[6]:
In [7]:
# Summary statistics for the Exposure column, as reported by Series.describe().
exposure_column = df['Exposure']
exposure_column.describe()
Out[7]:
In [9]:
# Pairwise correlation between the numeric columns.
# Numeric columns are selected explicitly because, starting with pandas 2.0,
# DataFrame.corr() no longer drops non-numeric columns silently and raises
# if any are present. select_dtypes works on both old and new pandas.
df.select_dtypes(include=['number']).corr()
Out[9]:
In [8]:
# Exposure is the explanatory variable in the regression fitted in this
# notebook (Mortality ~ Exposure), so it goes on the x-axis and the response,
# Mortality, goes on the y-axis.
df.plot(kind='scatter', x='Exposure', y='Mortality')
Out[8]:
In [10]:
# Ordinary least squares regression of Mortality on Exposure.
# The model is specified first and then fitted; `lm` holds the fitted results.
mortality_model = smf.ols(formula='Mortality~Exposure', data=df)
lm = mortality_model.fit()

# Show the estimated coefficients.
lm.params
Out[10]:
In [11]:
# Read the fitted coefficients by label rather than unpacking lm.params
# positionally, so the code does not depend on the order of its entries.
# float() yields plain Python floats.
intercept = float(lm.params['Intercept'])
slope = float(lm.params['Exposure'])  # coefficient on Exposure, not an exposure value

# Predicted Mortality on the fitted line for an Exposure value of 10.
exposure_level = 10
Mortality = slope * exposure_level + intercept
In [12]:
# Display the Mortality value computed from the fitted coefficients.
Mortality
Out[12]:
In [ ]:
In [13]:
# Recompute the prediction from the fitted model.
# Coefficients are looked up by label instead of by position in lm.params,
# and the slope gets its own name so it is not mistaken for an exposure value.
intercept = float(lm.params['Intercept'])
slope = float(lm.params['Exposure'])

# Predicted Mortality on the fitted line for an Exposure value of 10.
exposure_level = 10
Mortality = slope * exposure_level + intercept
In [14]:
# Display the Mortality value computed in the preceding cell.
Mortality
Out[14]:
In [ ]: