Download the data file (loaded below as Accidents7904.csv) from: https://data.gov.uk/dataset/road-accidents-safety-data/resource/80b76aec-a0a1-4e14-8235-09cc6b92574a
Excel (or OpenOffice) can't open it, since it's too large. Can Python help?
Note: If the code freezes, kill IPython and try again.
In [ ]:
import pandas as pd
In [ ]:
# Load the whole accidents CSV into memory as a single DataFrame.
csv_path = "Accidents7904.csv"
data = pd.read_csv(csv_path)
In [ ]:
# Number of rows loaded from the CSV.
data.shape[0]
In [ ]:
# Keep only the rows whose Day_of_Week code is 1 (treated as Sunday,
# going by the variable name), then show how many there are.
sunday_mask = data["Day_of_Week"] == 1
accidents_sunday = data.loc[sunday_mask]
len(accidents_sunday)
In [ ]:
# Day_of_Week code 1 accidents that involved more than 20 vehicles.
# Each condition is built as its own boolean mask and then combined
# element-wise with `&`.
is_sunday = data["Day_of_Week"] == 1
over_twenty_vehicles = data["Number_of_Vehicles"] > 20
accidents_sunday_twenty_cars = data.loc[is_sunday & over_twenty_vehicles]
len(accidents_sunday_twenty_cars)
In [ ]:
# Day_of_Week code 1 accidents with more than 20 vehicles and
# Weather_Conditions code 2 (treated as rain, going by the variable name).
is_sunday = data["Day_of_Week"] == 1
over_twenty_vehicles = data["Number_of_Vehicles"] > 20
weather_code_two = data["Weather_Conditions"] == 2
accidents_sunday_twenty_cars_rain = data.loc[
    is_sunday & over_twenty_vehicles & weather_code_two
]
len(accidents_sunday_twenty_cars_rain)
In [ ]:
# Rows with Police_Force code 1 (treated as London, going by the variable
# name) that also have Day_of_Week code 1.
# Each comparison must be parenthesised: `&` binds tighter than `==`, so
# without the parentheses the expression is evaluated as
# `data['Police_Force'] == (1 & (data.Day_of_Week == 1))`.
london_data = data[(data['Police_Force'] == 1) & (data.Day_of_Week == 1)]
len(london_data)
In [ ]:
# Restrict the London rows to accidents dated in the year 2000.
#
# The 'Date' column is parsed once; values that cannot be parsed become NaT
# (errors='coerce') and therefore never match the year test below.
# Selecting on the year keeps 1 January and 31 December, which strict
# `>` / `<` comparisons against those two dates would drop.
# NOTE(review): if 'Date' is stored day-first (dd/mm/yyyy) - TODO confirm
# against the CSV - pass dayfirst=True so days 1-12 are not read as months.
accident_dates = pd.to_datetime(london_data['Date'], errors='coerce')
london_data_2000 = london_data[accident_dates.dt.year == 2000]
len(london_data_2000)
In [ ]:
# Export the filtered rows to an .xlsx workbook, on a sheet named 'Sheet1'.
# The `with` block writes and closes the file on exit, even if to_excel
# raises; it replaces the explicit writer.save() call, which newer pandas
# releases no longer provide.
with pd.ExcelWriter('London_Sundays_2000.xlsx', engine='xlsxwriter') as writer:
    london_data_2000.to_excel(writer, sheet_name='Sheet1')
In [ ]: