In [1]:
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np
%matplotlib inline
In [2]:
# Fetch the station data file into the working directory.
# -N (timestamping) makes wget overwrite southamptondata.txt in place and skip
# the transfer when the local copy is current; without it a re-run saves
# southamptondata.txt.1 and the notebook keeps reading the stale first copy.
!wget -N http://www.metoffice.gov.uk/pub/data/weather/uk/climate/stationdata/southamptondata.txt
In [23]:
# IPython help lookup: the trailing `?` displays the documentation for pd.read_csv.
# NOTE(review): development aid only — nothing below depends on this cell.
pd.read_csv?
In [42]:
def remove_star(x):
    """Return the raw field text with every '*' marker removed."""
    return x.replace("*", "")


def dateparse(x, y):
    """Build timestamp(s) from year text `x` and month text `y`.

    Works on scalars or on whole Series. The '%Y %m' format carries no day
    component, so every result falls on the first day of the month.
    """
    return pd.to_datetime(x + " " + y, format="%Y %m")


# skipfooter is only implemented by the python engine, so request it
# explicitly instead of relying on pandas' warning-and-fallback behaviour.
station_raw = pd.read_csv(
    "southamptondata.txt",
    skiprows=[0, 1, 2, 3, 4, 6],
    sep=" ",
    skipinitialspace=True,
    na_values="---",
    skipfooter=1,
    engine="python",
    converters={2: remove_star, 3: remove_star, 4: remove_star, 5: remove_star},
)

# Everything after the two leading year/month columns is measurement data.
df = station_raw.iloc[:, 2:].copy()

# Converters hand back text, so the four cleaned columns have to be made
# numeric explicitly; left alone they stay object dtype. to_numeric raises on
# anything that is still not a number rather than silently keeping text.
for cleaned_col in df.columns[:4]:
    df[cleaned_col] = pd.to_numeric(df[cleaned_col])

# Build the date column ourselves: pd.datetime, date_parser= and the nested
# parse_dates={...} form are deprecated or removed in current pandas.
year_text = station_raw.iloc[:, 0].astype(str)
month_text = station_raw.iloc[:, 1].astype(str)
df.insert(0, "date", dateparse(year_text, month_text))

df.head()
Out[42]:
In [35]:
# Print a summary of the parsed frame: column names, dtypes and non-null counts.
df.info()
In [45]:
# Pull plain NumPy arrays out of the frame for plotting.
dates = df.date.values
rain = df.rain.values  # not plotted in this cell; kept in case later cells read it
tmax = df.tmax.values

# Use an explicit figure/axes pair and label the chart so it stands alone;
# the trailing semicolon keeps the return value out of the cell output.
fig, ax = plt.subplots()
ax.plot(dates, tmax)
ax.set(title="Southampton tmax by month", xlabel="date", ylabel="tmax");
Out[45]: