In [7]:
import os
import pandas as pd


# Directory that holds the per-year name files (yobYYYY.txt).
# Raw string literal: the Windows path contains backslash sequences (\P, \d)
# that are not valid escapes in a normal string and raise warnings on newer
# Python versions. The resulting value is unchanged.
source_path = r'D:\Python_my\Python_Netology_homework\data_names'
# Absolute, normalized form used when building individual file paths.
source_dir_path = os.path.normpath(os.path.abspath(source_path))


def download_year_data(year, data_dir=None, names=('Ruth', 'Robert')):
    """Read one year's name file and return the total count per selected name.

    The file ``yob<year>.txt`` is read as header-less CSV with the columns
    ``Name``, ``Gender`` and ``Count``. Rows whose name is in ``names`` are
    kept, the gender column is discarded, and counts are summed per name.

    Parameters
    ----------
    year : int or str
        Year substituted into the file name ``yob{year}.txt``.
    data_dir : str, optional
        Directory containing the file. Defaults to the module-level
        ``source_dir_path``.
    names : iterable of str, optional
        Names to keep. Defaults to ``('Ruth', 'Robert')``.

    Returns
    -------
    pandas.DataFrame
        Indexed by ``Name`` with a single ``Count`` column holding the sum
        over all matching rows for that name.
    """
    if data_dir is None:
        # Fall back to the notebook-wide data directory.
        data_dir = source_dir_path
    source_file = os.path.normpath(os.path.join(data_dir, 'yob{}.txt'.format(year)))
    year_data = pd.read_csv(source_file, names=['Name', 'Gender', 'Count'])
    # Keep only the requested names; Gender is left out so that the sum below
    # adds up the rows of a name regardless of gender.
    selected = year_data.loc[year_data['Name'].isin(list(names)), ['Name', 'Count']]
    return selected.groupby('Name').sum()

# Per-year totals for the selected names, keyed by year (1900 through 1903).
names_dict = {year: download_year_data(year) for year in range(1900, 1904)}

# Stack the yearly frames into one; the dict keys become an outer index
# level named 'Year' on top of each frame's 'Name' index.
ruth_n_robert_all_time = pd.concat(names_dict, names=['Year'])



Out[7]:
<matplotlib.axes._subplots.AxesSubplot at 0x1babe0aac8>

In [8]:
# Move the 'Name' index level into the columns: one row per year,
# one column per name.
ruth_n_robert_dynamics = ruth_n_robert_all_time.unstack(level='Name')
ruth_n_robert_dynamics


Out[8]:
Count
Name Robert Ruth
Year
1900 3845 4781
1901 2559 3989
1902 3201 4401
1903 3057 4531

In [9]:
# Line chart of the yearly counts, one line per name.
# The y-axis is labelled so the figure can be read on its own; the trailing
# ';' keeps the returned object's repr out of the cell output.
dynamics_ax = ruth_n_robert_dynamics.plot(title='Ruth vs Robert', grid=True)
dynamics_ax.set_ylabel('Count');


Out[9]:
<matplotlib.axes._subplots.AxesSubplot at 0x1ba66ca588>

In [10]:
# Same data as grouped bars, one group per year.
# Title and y label added so the figure stands alone; the trailing ';'
# keeps the returned object's repr out of the cell output.
bars_ax = ruth_n_robert_dynamics.plot.bar(title='Ruth vs Robert')
bars_ax.set_ylabel('Count');


Out[10]:
<matplotlib.axes._subplots.AxesSubplot at 0x1babe4cef0>

In [ ]: