In [1]:
import pandas as pd
In [2]:
# Read the accident records from the CSV file sitting next to the notebook.
accidents_csv_path = "Accidents7904.csv"
data = pd.read_csv(accidents_csv_path)
In [3]:
# Confirm what kind of object read_csv handed back.
# print() with a single argument behaves the same on Python 2 and Python 3.
print(type(data))
In [4]:
# Show every column label of the loaded frame as a plain Python list.
data.columns.tolist()
Out[4]:
In [5]:
# Preview the first five accident identifiers.
# The header for this column carries the file's UTF-8 byte-order mark, and a
# BOM can only sit at the very start of a file, so this is the first column.
# Selecting it by position works whether or not the CSV reader strips the BOM
# (a byte-string key with the BOM only matches on Python 2).
data.iloc[:, 0][:5]
Out[5]:
In [6]:
# Keep only the rows whose Police_Force code equals 1
# (presumably the London force, going by the variable name -- confirm against
# the dataset's code book).
# .copy() makes the subset an independent frame, so assigning a column to it
# later does not raise SettingWithCopyWarning or write into a temporary view.
data_london = data[data['Police_Force'] == 1].copy()
print(data_london[:5])
In [7]:
# Inspect the Python type of the first 'Date' value in the filtered frame.
# .iloc[0] is positional; a bare [0] is a label lookup that only succeeds
# while a row labelled 0 happens to survive the Police_Force filter.
type(data_london['Date'].iloc[0])
Out[7]:
In [8]:
# Convert the 'Date' column into pandas timestamps.
# NOTE(review): this file looks like the UK road-accident extract, whose dates
# are written day-first (dd/mm/yyyy) -- confirm against the raw column.
# Without dayfirst=True pandas reads ambiguous values such as 05/01/1979 as
# 1 May instead of 5 January, silently corrupting every later date filter.
# assign() returns a new frame, so nothing is written into a filtered selection.
data_london = data_london.assign(
    Date=pd.to_datetime(data_london['Date'], dayfirst=True)
)
In [9]:
# Look at the first five 'Date' values (head() defaults to five rows).
data_london['Date'].head()
Out[9]:
In [10]:
# Sanity check: is the first row dated after 1 January 2000?
# Positional .iloc[0] avoids relying on a row labelled 0 existing after the filter.
data_london['Date'].iloc[0] > pd.to_datetime('2000-01-01')
Out[10]:
In [11]:
# Sanity check: is the first row dated after 1 January 1979?
# Positional .iloc[0] avoids relying on a row labelled 0 existing after the filter.
data_london['Date'].iloc[0] > pd.to_datetime('1979-01-01')
Out[11]:
In [12]:
# Display the first row of the filtered frame as a one-row DataFrame.
data_london.head(1)
Out[12]:
In [13]:
# Keep only the rows dated after the cutoff. The comparison is strict, so a
# row whose timestamp equals the cutoff exactly is dropped.
date_cutoff = pd.to_datetime('2000-01-01')
data_london_new = data_london[data_london['Date'] > date_cutoff]

# Report how many rows remain and preview the first five.
# print() calls run unchanged on Python 2 and Python 3.
print(len(data_london_new))
print(data_london_new[:5])
In [14]:
# Look at the first five 'Time' values of the post-cutoff rows.
data_london_new['Time'].head()
Out[14]:
In [15]:
# Show the second 'Time' entry (position 1) and the Python type it is stored as.
# print() calls run unchanged on Python 2 and Python 3.
second_time = data_london_new['Time'].iloc[1]
print(second_time)
print(type(second_time))
In [16]:
# Try parsing a single 'Time' entry to see what timestamp pandas produces.
first_time_value = data_london['Time'].iloc[0]
pd.to_datetime(first_time_value)
Out[16]:
In [17]:
# Display every field of the first row (by position) as a Series.
data_london.iloc[0, :]
Out[17]:
In [59]:
# Narrow the post-cutoff rows down to the three columns used from here on.
# .copy() detaches the result from data_london_new, so sorting or otherwise
# modifying it later cannot raise SettingWithCopyWarning.
columns_of_interest = ['Date', 'Time', 'Number_of_Casualties']
data_london_new2 = data_london_new[columns_of_interest].copy()
data_london_new2.head()
Out[59]:
In [60]:
# Order the rows by 'Date', ascending.
# DataFrame.sort() was deprecated in pandas 0.17 and later removed;
# sort_values() is its replacement. Rebinding the name instead of using
# inplace=True keeps the cell safe to re-run and avoids mutating a selection.
data_london_new2 = data_london_new2.sort_values('Date')
data_london_new2.head()
Out[60]:
In [61]:
# Order the rows by 'Time', ascending.
# NOTE(review): sorting on 'Time' alone replaces whatever ordering the frame
# had before (e.g. by 'Date'); if a date-then-time ordering was intended, use
# sort_values(['Date', 'Time']) instead -- confirm with the author.
# DataFrame.sort() was deprecated in pandas 0.17 and later removed;
# sort_values() is its replacement, and rebinding avoids inplace mutation.
data_london_new2 = data_london_new2.sort_values('Time')
data_london_new2.head()
Out[61]:
In [63]:
# Export the sorted frame to sheet 'Sheet1' of output.xlsx.
# The context manager saves and closes the workbook on exit, even if
# to_excel raises; the explicit ExcelWriter.save() call was removed in pandas 2.0.
# sheet_name is passed by keyword because positional use is deprecated.
with pd.ExcelWriter('output.xlsx') as writer:
    data_london_new2.to_excel(writer, sheet_name='Sheet1')
In [65]:
In [ ]: