In [5]:
import pandas as pd
%matplotlib inline
import matplotlib.pyplot as plt
import statsmodels.formula.api as smf
In [5]:
cd ..
In [6]:
pwd
Out[6]:
In [7]:
cd "C:\Users\Harsha Devulapalli\Desktop\algorithms\class4\homework\data"
In [8]:
# Read the workbook from the current working directory into `df`.
df = pd.read_excel(
    io="2013_NYC_CD_MedianIncome_Recycle.xlsx",
)
In [9]:
# Scatter of RecycleRate (y) against MdHHIncE (x) for a first look at the data.
df.plot.scatter(x="MdHHIncE", y="RecycleRate")
Out[9]:
In [30]:
# Ordinary least squares: regress RecycleRate on MdHHIncE and keep the
# fitted results object in `lm`.
lm = smf.ols(
    "RecycleRate~MdHHIncE",
    data=df,
).fit()
In [31]:
# Display the coefficients estimated by the fit above.
lm.params
Out[31]:
In [32]:
# Pull the coefficients out of lm.params by label rather than by position,
# so the assignment cannot silently swap if the coefficient order ever
# differs. The formula API labels the constant term "Intercept" and the
# regressor by its column name.
intercept = lm.params["Intercept"]
slope = lm.params["MdHHIncE"]
In [33]:
# Redraw the scatter and overlay the fitted line (slope*x + intercept) in red
# on the same axes.
ax = df.plot.scatter(x="MdHHIncE", y="RecycleRate")
ax.plot(df["MdHHIncE"], slope*df["MdHHIncE"]+intercept, "-", color="red")
Out[33]:
In [38]:
def returnrate(income):
    """Evaluate the fitted line at ``income``.

    Reads the notebook-level ``slope`` and ``intercept`` (assigned from
    ``lm.params`` in an earlier cell) and returns
    ``slope*income + intercept``.
    """
    return slope*income+intercept
In [39]:
# Value of the fitted line at an income of 20000.
returnrate(income=20000)
Out[39]: