In [2]:
import pandas as pd
import numpy as np
import datetime as datetime
import seaborn as sns
import matplotlib.pyplot as plt

# Default size of every figure in the notebook, as (width, height).
plt.rcParams['figure.figsize'] = 15, 5

# Read the three CSV datasets. For the trips, the start/end timestamps are
# parsed into datetimes while reading; the other two files are read as-is.
trip = pd.read_csv('db/trip.csv', parse_dates=['start_date', 'end_date'])
weather, status = (
    pd.read_csv(csv_path) for csv_path in ('db/weather.csv', 'db/stat80.csv')
)

In [3]:
# Preview the first ten trips to inspect the columns and the kind of values they hold.
trip.head(n=10)


Out[3]:
id duration start_date start_station_name start_station_id end_date end_station_name end_station_id bike_id subscription_type zip_code
0 4576 63 2013-08-29 14:13:00 South Van Ness at Market 66 2013-08-29 14:14:00 South Van Ness at Market 66 520 Subscriber 94127
1 4607 70 2013-08-29 14:42:00 San Jose City Hall 10 2013-08-29 14:43:00 San Jose City Hall 10 661 Subscriber 95138
2 4130 71 2013-08-29 10:16:00 Mountain View City Hall 27 2013-08-29 10:17:00 Mountain View City Hall 27 48 Subscriber 97214
3 4251 77 2013-08-29 11:29:00 San Jose City Hall 10 2013-08-29 11:30:00 San Jose City Hall 10 26 Subscriber 95060
4 4299 83 2013-08-29 12:02:00 South Van Ness at Market 66 2013-08-29 12:04:00 Market at 10th 67 319 Subscriber 94103
5 4927 103 2013-08-29 18:54:00 Golden Gate at Polk 59 2013-08-29 18:56:00 Golden Gate at Polk 59 527 Subscriber 94109
6 4500 109 2013-08-29 13:25:00 Santa Clara at Almaden 4 2013-08-29 13:27:00 Adobe on Almaden 5 679 Subscriber 95112
7 4563 111 2013-08-29 14:02:00 San Salvador at 1st 8 2013-08-29 14:04:00 San Salvador at 1st 8 687 Subscriber 95112
8 4760 113 2013-08-29 17:01:00 South Van Ness at Market 66 2013-08-29 17:03:00 South Van Ness at Market 66 553 Subscriber 94103
9 4258 114 2013-08-29 11:33:00 San Jose City Hall 10 2013-08-29 11:35:00 MLK Library 11 107 Subscriber 95060

In [5]:
# Count how many trips started on each day of the week (from start_date) and
# show the result as a bar plot.
# Note: dayofweek numbers the days from 0 (Monday) to 6 (Sunday).
WEEKDAY_LABELS = ['Lunes', 'Martes', 'Miercoles', 'Jueves', 'Viernes', 'Sabado', 'Domingo']

# value_counts() orders its result by frequency, so the counts are reindexed to
# 0..6: every bar then lines up with its weekday label whatever the data looks
# like, and a weekday with no trips still gets a (zero-height) bar.
trips_per_weekday = (
    trip['start_date']
    .dt.dayofweek
    .value_counts()
    .reindex(range(7), fill_value=0)
)

# The Axes is stored in `ax` so the pyplot module imported as `plt` is not
# overwritten; `kind` is passed by keyword because Series.plot does not accept
# it positionally in current pandas.
ax = trips_per_weekday.plot(kind='bar')
ax.set_xlabel('Dias de la semana');
ax.set_ylabel('Cantidad');
ax.set_title('Cantidad de viajes por dia de la semana');
ax.set_xticklabels(WEEKDAY_LABELS);

In [ ]: