In [3]:
%matplotlib inline
import matplotlib.pyplot as plt
import pandas as pd
In [12]:
# Load the names file (no header row) into a one-column frame; the file is
# expected to hold a single name per line.
# dtype=str and keep_default_na=False keep every entry as literal text: by
# default read_csv converts tokens such as "NA", "None", "null" or "nan" into
# a float NaN (and all-numeric columns into numbers), which would break the
# length computation below.
names = pd.read_csv(
    "../../data/names.txt",
    header=None,
    dtype=str,
    keep_default_na=False,
)
# Fails loudly with a length-mismatch error if the file parsed into more than
# one column (e.g. a line containing a comma).
names.columns = ["name"]
# Character count of each name, computed with the vectorised string accessor.
names["length"] = names["name"].str.len()
names.head()
Out[12]:
In [13]:
# Summary statistics of the frame. With default arguments describe() reports
# only numeric columns, which here should be just the derived "length" column.
names.describe()
Out[13]:
In [55]:
# Histogram of name lengths with one bar per integer length: bin edges sit on
# the integers, so the bar for length k covers [k, k + 1).
#
# Values outside the outermost edges are silently dropped by hist(), and the
# last bin is closed on both sides. The edges therefore always run one past the
# longest name, while never covering less than the 0..29 range.
longest = int(names["length"].max()) if len(names) else 0
bin_edges = list(range(max(30, longest + 2)))

fig, ax = plt.subplots()
ax.hist(names["length"], bins=bin_edges, rwidth=0.9, facecolor="green", alpha=0.75)
ax.set_title("Name Length Distribution")
ax.set_xlabel("Length")
# Trailing semicolon keeps the Text(...) repr out of the cell output.
ax.set_ylabel("#Names");
Out[55]:
In [ ]: