In [1]:
import pandas as pd

# Read the semicolon-separated commit export into a DataFrame.
df = pd.read_csv("../dataset/git_demo_timestamp_linux.csv", sep=";")

# Show the ten most frequent values of the "author" column with their counts.
df["author"].value_counts().head(10)
Out[1]:
In [2]:
%matplotlib inline
df.author.value_counts().head(10).plot(kind='pie')
Out[2]:
In [3]:
# Convert the "timestamp_local" column to pandas datetimes so the .dt
# accessor can be used on it, then store it back under the same column name.
parsed_timestamps = pd.to_datetime(df["timestamp_local"])
df["timestamp_local"] = parsed_timestamps

# Summary statistics of the frame after the conversion.
df.describe()
Out[3]:
In [4]:
# Bar chart of the number of rows per calendar year of "timestamp_local".
# value_counts(sort=False) only turns off the sort-by-frequency step; it does
# not order the result by year. sort_index() makes the bars run in ascending
# year order along the x-axis regardless of the row order in the data.
df.timestamp_local.dt.year.value_counts(sort=False).sort_index().plot(kind='bar')
Out[4]:
In [5]:
# Bar chart of the number of rows per hour of day of "timestamp_local".
# value_counts(sort=False) only turns off the sort-by-frequency step; it does
# not order the result by hour. sort_index() makes the bars run in ascending
# hour order along the x-axis so the daily distribution is readable.
df.timestamp_local.dt.hour.value_counts(sort=False).sort_index().plot(kind='bar')
Out[5]: