In [3]:
from __future__ import print_function
import os
import pandas as pd
from statsmodels.tsa import stattools
%matplotlib inline
from matplotlib import pyplot as plt
In [5]:
# Load the monthly aircraft-miles CSV into a pandas.DataFrame and use its
# 'Month' column as the row index (drop=False keeps 'Month' as a column too).
csv_path = 'datasets/us-airlines-monthly-aircraft-miles-flown.csv'
air_miles = pd.read_csv(csv_path).set_index('Month', drop=False)
In [7]:
# Preview the first ten rows of the frame
air_miles.iloc[:10]
Out[7]:
In [8]:
# Give the long data column a short, convenient name.
# The renamed frame is reassigned rather than mutated with inplace=True, so
# the cell is an explicit "new frame from old frame" step; columns that are
# not listed in the mapping are left unchanged.
air_miles = air_miles.rename(
    columns={
        'U.S. airlines: monthly aircraft miles flown (Millions) 1963 -1970':
            'Air miles flown',
    }
)
In [10]:
# Plot the time series of air miles flown and save the figure as a PNG.
fig = plt.figure(figsize=(5.5, 5.5))
ax = fig.add_subplot(1, 1, 1)
air_miles['Air miles flown'].plot(ax=ax)
ax.set_title('Monthly air miles flown during 1963 - 1970')
# Unit taken from the dataset's original column header ("(Millions)").
ax.set_ylabel('Air miles flown (Millions)')

# savefig does not create missing directories, so make sure the target
# folder exists before writing; otherwise the cell fails on a fresh checkout.
plot_path = 'plots/ch2/B07887_02_13.png'
plot_dir = os.path.dirname(plot_path)
if not os.path.isdir(plot_dir):
    os.makedirs(plot_dir)

# Save through the figure object instead of pyplot's implicit current figure.
fig.savefig(plot_path, format='png', dpi=300)
In [19]:
# Run the Augmented Dickey-Fuller test on the air-miles series, passing
# autolag='AIC' to adfuller; the full result tuple is kept in adf_result.
miles_flown = air_miles['Air miles flown']
adf_result = stattools.adfuller(miles_flown, autolag='AIC')
In [20]:
# Report element 1 of the adfuller result, labelled as the test's p-value.
adf_pvalue = adf_result[1]
print('p-val of the ADF test in air miles flown:', adf_pvalue)