Download the data file (loaded below as `Accidents7904.csv`) from: https://data.gov.uk/dataset/road-accidents-safety-data/resource/80b76aec-a0a1-4e14-8235-09cc6b92574a

Excel (or OpenOffice) can't open it, since it's too large. Can Python help?

Note: If the code freezes, restart the IPython kernel and try again.


In [ ]:
import pandas as pd

In [ ]:
# Read the whole accidents table into memory; the file is expected to sit in
# the notebook's working directory.
accidents_csv_path = "Accidents7904.csv"
data = pd.read_csv(accidents_csv_path)

In [ ]:
# Total number of rows loaded from the CSV.
len(data.index)

In [ ]:
# Keep only rows whose Day_of_Week code is 1 (this notebook treats 1 as Sunday).
is_sunday = data["Day_of_Week"] == 1
accidents_sunday = data[is_sunday]
len(accidents_sunday)

In [ ]:
# Sunday accidents (Day_of_Week code 1) that involved more than 20 vehicles.
sunday_mask = data["Day_of_Week"].eq(1)
over_twenty_vehicles_mask = data["Number_of_Vehicles"].gt(20)
accidents_sunday_twenty_cars = data[sunday_mask & over_twenty_vehicles_mask]
len(accidents_sunday_twenty_cars)

In [ ]:
# Sunday accidents with more than 20 vehicles and Weather_Conditions code 2
# (the variable name suggests code 2 means rain -- confirm against the
# dataset's code book).
sunday_mask = data["Day_of_Week"] == 1
over_twenty_vehicles_mask = data["Number_of_Vehicles"] > 20
weather_code_2_mask = data["Weather_Conditions"] == 2
accidents_sunday_twenty_cars_rain = data[
    sunday_mask & over_twenty_vehicles_mask & weather_code_2_mask
]
len(accidents_sunday_twenty_cars_rain)

In [ ]:
# Sunday accidents (Day_of_Week code 1) recorded under Police_Force code 1,
# which this notebook treats as London.
# Each comparison must be wrapped in its own parentheses: `&` binds tighter
# than `==`, so an unparenthesised `a == 1 & (b == 1)` is evaluated as
# `a == (1 & (b == 1))` and does not select the intended rows.
london_data = data[(data['Police_Force'] == 1) & (data.Day_of_Week == 1)]
len(london_data)

In [ ]:
# Restrict the London Sunday accidents to calendar year 2000.
#
# The Date column is parsed once. `errors='coerce'` turns unparseable values
# into NaT, which never compare equal to 2000 and are therefore dropped.
# NOTE(review): dayfirst=True assumes the column holds DD/MM/YYYY strings --
# confirm against the CSV; ISO-formatted dates are unaffected by this flag.
accident_dates = pd.to_datetime(
    london_data['Date'], errors='coerce', dayfirst=True)

# Filtering on the year keeps 1 January and 31 December, which a strict
# `> 2000-01-01` / `< 2000-12-31` comparison would silently exclude.
london_data_2000 = london_data[accident_dates.dt.year == 2000]

len(london_data_2000)

In [ ]:
# Export the filtered rows to an Excel workbook small enough for a spreadsheet
# application to open.
# The context manager saves and closes the file on exit, even if to_excel
# raises; it replaces the explicit `writer.save()` call, which newer pandas
# releases no longer provide.
with pd.ExcelWriter(
        'London_Sundays_2000.xlsx', engine='xlsxwriter') as writer:
    london_data_2000.to_excel(writer, sheet_name='Sheet1')

In [ ]: