In [83]:
import numpy as np
import pandas as pd
from scipy import stats
In [84]:
# Load the dataset; the path is relative to the notebook's working directory.
df = pd.read_csv(filepath_or_buffer='datasets/dataset2.csv')
In [85]:
# Pull one column out of the frame as a plain array of values.
# NOTE(review): the key 'average_montly_hours' is kept exactly as written;
# presumably it matches the CSV header spelling - confirm before changing it.
hours = df.loc[:, 'average_montly_hours'].values
In [86]:
# Standardise the hours: subtract the mean, then divide by the standard
# deviation. np.std is called with its default ddof=0 (population form).
hours_mean = np.mean(hours)
hours_std = np.std(hours)
norm_hours = (hours - hours_mean) / hours_std
In [87]:
# Display the values laid out as a single column (second dimension of size 1).
# The reshaped array is only shown as the cell output; it is not assigned,
# so norm_hours itself keeps its original shape.
np.reshape(norm_hours, (-1, 1))
Out[87]:
In [88]:
# Summary statistics of the standardised hours, shown as the cell output.
# axis=0 and ddof=1 are scipy's defaults, spelled out here: the reported
# variance uses ddof=1, whereas np.std defaults to ddof=0.
stats.describe(norm_hours, axis=0, ddof=1)
Out[88]:
In [ ]: