In [47]:
import pandas as pd
%matplotlib inline
import matplotlib.pyplot as plt
import statsmodels.formula.api as smf
In [48]:
# Load the spreadsheet into a DataFrame. The path is relative to the
# notebook's working directory, so the kernel must be started from the
# folder that contains `data/`.
df = pd.read_excel(
    "data/2013_NYC_CD_MedianIncome_Recycle.xlsx"
)
In [49]:
# Preview the first five rows of the freshly loaded frame.
df.head(n=5)
Out[49]:
In [51]:
# Ordinary least squares: regress RecycleRate on MdHHIncE using the
# formula interface, then fit immediately so `lm` is the results object.
lm = (
    smf.ols(formula="RecycleRate~MdHHIncE", data=df)
    .fit()
)
In [52]:
# Display the coefficients estimated by the fit above.
lm.params
Out[52]:
In [53]:
# Pull the two fitted coefficients out of the params Series by label
# rather than by position, so each name is visibly tied to its term.
# `Median_Income` is the slope on the MdHHIncE regressor.
Intercept = lm.params["Intercept"]
Median_Income = lm.params["MdHHIncE"]
In [58]:
# Apply the fitted line (intercept + slope * x) to every row's MdHHIncE
# and store the result next to the observed values.
income = df['MdHHIncE']
df['Predicted RecycleRate'] = Intercept + income * Median_Income
In [59]:
# Preview the first five rows again; the frame now also carries the
# 'Predicted RecycleRate' column.
df.head(n=5)
Out[59]:
In [56]:
# Coefficients of the fitted line, looked up by label. These are the same
# values as `Intercept` / `Median_Income` elsewhere in this notebook, under
# the shorter names the plotting cell uses.
intercept = lm.params["Intercept"]
slope = lm.params["MdHHIncE"]
In [57]:
# Scatter the observed points and keep the Axes that pandas returns, so the
# regression line is drawn on that exact Axes instead of relying on
# pyplot's implicit "current axes".
ax = df.plot(kind="scatter", x="MdHHIncE", y="RecycleRate")
# Overlay the fitted line (intercept + slope * x) in red.
ax.plot(df["MdHHIncE"], intercept + slope * df["MdHHIncE"], "-", color="red")
Out[57]:
In [ ]:
In [ ]: