In [1]:
import pandas as pd

# Load the per-game averages into a DataFrame.
# DataFrame.from_csv was deprecated in pandas 0.21 and removed in 1.0;
# read_csv with index_col=0 and parse_dates=True reproduces its defaults
# (first CSV column becomes the index, and pandas attempts to parse that
# index as dates).
# NOTE(review): if the first column is not date-like, parse_dates=True can
# be dropped -- confirm against the CSV.
df = pd.read_csv(
    '2014-15-player-per-game-averages.csv',
    index_col=0,
    parse_dates=True,
)

# Preview the first rows as the cell's rich output.
df.head()
Out[1]:
That was a little easier than my own helper class :)
Let's now examine a scatter matrix comparing all combinations of the numerical stats.
In [16]:
import matplotlib.pyplot as plt
from pandas.tools.plotting import scatter_matrix
%matplotlib inline
%config InlineBackend.figure_format = 'retina'
scatter_matrix(
df[['height_inches', 'weight_lbs', 'min', 'pts', 'reb', 'ast', 'blk']],
figsize = (12, 12)
)
# plt.savefig('nba-scatter.png')
None