In [ ]:
import pandas as pd
from pprint import pprint
import matplotlib.pyplot as plt
# Apply matplotlib's 'ggplot' style sheet to every plot drawn after this call.
plt.style.use('ggplot')
%matplotlib inline
In [ ]:
# Load the preprocessed dataset from its tab-separated file into a DataFrame.
df = pd.read_csv('data/preprocessed.tsv', sep='\t')
In [ ]:
# Pretty-print the DataFrame's column labels as a plain Python list.
pprint(list(df.columns))
In [ ]:
# Summary statistics (as produced by `describe`) for the `n_votes` column.
df.loc[:, 'n_votes'].describe()
In [ ]:
# ENTER CODE HERE
In [ ]:
# Histogram of the `n_votes` column, bucketed into 20 bins.
df['n_votes'].hist(bins=20)
In [ ]:
# ENTER CODE HERE
In [ ]:
# Bar chart of the number of rows per distinct `section` value.
df['section'].value_counts().plot.bar()
In [ ]:
# Same per-`section` row counts as above, drawn as a pie chart.
df['section'].value_counts().plot.pie()
In [ ]:
### ENTER CODE HERE
In [ ]:
# Scatter plot with `n_votes` on the x-axis and `selected` on the y-axis.
df.plot(kind="scatter", x="n_votes", y="selected")
In [ ]:
### ENTER CODE HERE