In [4]:
%pylab inline

import pandas as pd


Populating the interactive namespace from numpy and matplotlib

In [5]:
# Load the training data and look at the distribution of `cost` on a
# log(1 + cost) scale.
train_set = pd.read_csv("data/competition_data/train_set.csv")

# np.log1p(x) computes log(1 + x) without the precision loss that
# np.log(x + 1) suffers when x is close to zero.
ax = np.log1p(train_set["cost"]).hist(bins=100)
ax.set(title="train_set: log(1 + cost)", xlabel="log(1 + cost)", ylabel="count")
ax  # keep the Axes as the cell's displayed value


Out[5]:
<matplotlib.axes._subplots.AxesSubplot at 0x4fa5250>

In [7]:
# Load train_pred.csv and plot the distribution of its `cost` column.
# NOTE(review): presumably these are model predictions for the training
# rows -- confirm against whatever writes train_pred.csv.
train_pred = pd.read_csv("train_pred.csv")

# Histogram on the log(1 + cost) scale rather than the raw scale.
# np.log1p(x) computes log(1 + x) accurately even when x is near zero.
ax = np.log1p(train_pred["cost"]).hist(bins=100)
ax.set(title="train_pred: log(1 + cost)", xlabel="log(1 + cost)", ylabel="count")
ax  # keep the Axes as the cell's displayed value


Out[7]:
<matplotlib.axes._subplots.AxesSubplot at 0x56d3890>

In [6]:
# Load test_pred.csv and plot the distribution of its `cost` column.
# NOTE(review): presumably these are model predictions for the test
# rows -- confirm against whatever writes test_pred.csv.
test_pred = pd.read_csv("test_pred.csv")

# Histogram on the log(1 + cost) scale rather than the raw scale.
# np.log1p(x) computes log(1 + x) accurately even when x is near zero.
ax = np.log1p(test_pred["cost"]).hist(bins=100)
ax.set(title="test_pred: log(1 + cost)", xlabel="log(1 + cost)", ylabel="count")
ax  # keep the Axes as the cell's displayed value


Out[6]:
<matplotlib.axes._subplots.AxesSubplot at 0x54b0a90>

In [ ]: