Using the 2013_NYC_CD_MedianIncome_Recycle.xlsx file, calculate the correlation between the recycling rate and the median income. Discuss your findings in your PR.
In [1]:
import pandas as pd
import matplotlib
%matplotlib inline
In [2]:
# Read the workbook named in the assignment into a DataFrame.
df = pd.read_excel(
    io='data/2013_NYC_CD_MedianIncome_Recycle.xlsx',
)
In [3]:
# Preview the first five rows to check the columns that were loaded.
df.head(n=5)
Out[3]:
In [9]:
# Scatter plot of RecycleRate (y) against MdHHIncE (x).
# NOTE(review): MdHHIncE is presumably the median household income estimate — confirm against the data dictionary.
df.plot.scatter(x='MdHHIncE', y='RecycleRate')
Out[9]:
In [11]:
# Correlate only the two columns the assignment asks about.
# Calling corr() on the whole frame tries to include every column; on
# pandas >= 2.0 (numeric_only defaults to False) that raises ValueError if
# the sheet contains any text column. Selecting the columns first works on
# every pandas version and puts the income/recycling coefficient front and centre.
# corr() uses its default method (Pearson).
df[['MdHHIncE', 'RecycleRate']].corr()
Out[11]:
In [ ]: