In [4]:
%reset
In [1]:
import pandas as pd
import seaborn as sns
import numpy as np
%matplotlib inline
In [2]:
# Load the cleaned check-in table (path is relative to this notebook's directory).
checkin = pd.read_csv(
    filepath_or_buffer='../../../data/interim/clean_US_cities/checkin_clean.csv',
)
In [3]:
# Preview the first five rows of the freshly loaded frame.
checkin.head(n=5)
Out[3]:
In [19]:
# Print the frame's summary (column names, non-null counts, dtypes, memory use).
checkin.info()
In [97]:
# Making columns aggregating checkins by day of week.
#
# Each `time` value is a string; its first and last characters are dropped
# (presumably the enclosing brackets of a list repr -- TODO confirm) and the
# remainder is split on commas. For every weekday we keep only the pieces that
# contain that day's three-letter abbreviation and store them in
# `<day>_list` (mon_list, tue_list, ...).
#
# The source frame is `checkin`, the one loaded from the CSV; no frame named
# `checkins` exists in this notebook.
for day in ('Mon', 'Tue', 'Wed', 'Thu', 'Fri', 'Sat', 'Sun'):
    checkin[day.lower() + '_list'] = checkin['time'].map(
        # `day=day` pins the current abbreviation inside the lambda.
        lambda raw, day=day: [entry for entry in raw[1:-1].split(',') if day in entry]
    )
In [98]:
# Converting day of week lists to dictionaries so that # of checkins can be looked up by hour
def _hour_counts(entries, day):
    """Turn one weekday's list of entries into an ``{hour: count}`` dict.

    Every entry has its spaces and the ``'<day>-'`` prefix removed and is then
    split on ``':'``; the first piece becomes the integer key and the second
    the integer value. If the same key appears more than once, the last entry
    wins.

    Parameters
    ----------
    entries : list of str, or dict
        The pieces selected for this weekday. A dict is returned unchanged so
        that re-running the cell on already-converted columns is harmless.
    day : str
        Three-letter weekday abbreviation, e.g. ``'Mon'``.

    Returns
    -------
    dict
        Mapping of int to int.

    Raises
    ------
    ValueError
        If a piece is not a valid integer literal.
    IndexError
        If an entry contains no ``':'``.
    """
    if isinstance(entries, dict):
        return entries
    counts = {}
    for entry in entries:
        # Parse each entry once, e.g. ' Mon-13:2' -> ['13', '2'].
        # NOTE(review): assumes entries carry no quote characters -- confirm
        # against the cleaned CSV.
        parts = entry.replace(' ', '').replace(day + '-', '').split(':')
        counts[int(parts[0])] = int(parts[1])
    return counts


# The `<day>_list` columns are overwritten in place: afterwards they hold
# dicts rather than lists, despite the name.
for day in ('Mon', 'Tue', 'Wed', 'Thu', 'Fri', 'Sat', 'Sun'):
    column = day.lower() + '_list'
    checkin[column] = checkin[column].map(
        lambda entries, day=day: _hour_counts(entries, day)
    )
In [102]:
# Inspect the first five rows again, now including the per-weekday columns.
checkin.head(n=5)
Out[102]: