In [ ]:
    
import pandas as pd
from pprint import pprint
import matplotlib.pyplot as plt
# Apply matplotlib's built-in 'ggplot' style sheet to every figure drawn below.
plt.style.use('ggplot')
# IPython magic: render matplotlib figures inline in the notebook output.
%matplotlib inline
    
In [ ]:
    
# Load the preprocessed dataset; the file is tab-separated, so the
# delimiter is spelled out explicitly.
df = pd.read_csv('data/preprocessed.tsv', sep='\t')
    
In [ ]:
    
# Pretty-print the column names as a plain Python list.
pprint(list(df.columns))
    
In [ ]:
    
# Summary statistics for the 'n_votes' column (all rows).
df.loc[:, 'n_votes'].describe()
    
In [ ]:
    
# ENTER CODE HERE
    
In [ ]:
    
# Histogram of the 'n_votes' column using 20 bins.
# Series.hist returns the matplotlib Axes, so the title and axis labels are
# set on it directly; the trailing ';' keeps the Axes repr out of the output.
df['n_votes'].hist(bins=20).set(
    title='Distribution of n_votes',
    xlabel='n_votes',
    ylabel='Frequency',
);
    
In [ ]:
    
# ENTER CODE HERE
    
In [ ]:
    
# Bar chart of how many rows fall into each distinct 'section' value.
# The title is passed to pandas; the axis labels are set on the returned Axes
# so the figure can be read on its own. The trailing ';' hides the Axes repr.
df['section'].value_counts().plot.bar(
    title='Number of rows per section',
).set(xlabel='section', ylabel='count');
    
In [ ]:
    
# Pie chart of the same per-section counts, shown as shares of the whole.
# The auto-generated y-axis label is blanked because it only adds clutter
# next to a pie; the title carries the description instead.
# The trailing ';' hides the Axes repr.
df['section'].value_counts().plot.pie(
    title='Share of rows per section',
).set(ylabel='');
    
In [ ]:
    
### ENTER CODE HERE
    
In [ ]:
    
# Scatter plot of 'selected' against 'n_votes'. pandas labels both axes with
# the column names, so only a title is added; the trailing ';' hides the
# Axes repr.
df.plot.scatter(x="n_votes", y="selected", title="selected vs. n_votes");
    
In [ ]:
    
### ENTER CODE HERE