Q-1-2_Neural_Nets_with_a_random_first_layer

Janet Matsen

Code notes:


In [ ]:
import numpy as np
import matplotlib as mpl
%matplotlib inline
import time

import pandas as pd
import seaborn as sns

from mnist import MNIST  # public package for making arrays out of MINST data.

In [ ]:
import sys
sys.path.append('../code/')

In [ ]:
from ridge_regression import RidgeMulti
from hyperparameter_explorer import HyperparameterExplorer

In [ ]:
from mnist_helpers import mnist_training, mnist_testing

In [ ]:
import matplotlib.pyplot as plt
from pylab import rcParams
rcParams['figure.figsize'] = 4, 3

Prepare MNIST training data


In [ ]:
train_X, train_y = mnist_training()
test_X, test_y = mnist_testing()

Explore hyperparameters before training model on all of the training data.


In [ ]:
hyper_explorer = HyperparameterExplorer(X=train_X, y=train_y, 
                                        model=RidgeMulti, 
                                        validation_split=0.1, score_name = 'training RMSE', 
                                        use_prev_best_weights=False,
                                        test_X = test_X, test_y = test_y)

In [ ]:
hyper_explorer.train_model(lam=1e10, verbose=False)

In [ ]:
hyper_explorer.train_model(lam=1e+08, verbose=False)
hyper_explorer.train_model(lam=1e+07, verbose=False)

In [ ]:
hyper_explorer.train_model(lam=1e+06, verbose=False)

In [ ]:
hyper_explorer.train_model(lam=1e5, verbose=False)
hyper_explorer.train_model(lam=1e4, verbose=False)
hyper_explorer.train_model(lam=1e03, verbose=False)
hyper_explorer.train_model(lam=1e2, verbose=False)

In [ ]:
hyper_explorer.train_model(lam=1e1, verbose=False)

In [ ]:
hyper_explorer.train_model(lam=1e0, verbose=False)
hyper_explorer.train_model(lam=1e-1, verbose=False)
hyper_explorer.train_model(lam=1e-2, verbose=False)
hyper_explorer.train_model(lam=1e-3, verbose=False)
hyper_explorer.train_model(lam=1e-4, verbose=False)
hyper_explorer.train_model(lam=1e-5, verbose=False)

In [ ]:
hyper_explorer.summary

In [ ]:
hyper_explorer.plot_fits()

In [ ]:
t = time.localtime(time.time())

hyper_explorer.plot_fits(filename = "Q-1-1-3_val_and_train_RMSE_{}-{}".format(t.tm_mon, t.tm_mday))

In [ ]:
hyper_explorer.plot_fits(ylim=(.6,.7),
                         filename = "Q-1-1-3_val_and_train_RMSE_zoomed_in{}-{}".format(t.tm_mon, t.tm_mday))

In [ ]:
hyper_explorer.best('score')

In [ ]:
hyper_explorer.best('summary')

In [ ]:
hyper_explorer.best('best score')

In [ ]:
hyper_explorer.train_on_whole_training_set(lam=1e7)

In [ ]:
hyper_explorer.final_model.results_row()

In [ ]:
hyper_explorer.evaluate_test_data()

In [ ]:


In [ ]: