Variables/Functions ^


In [1]:
from IPython.core.debugger import Tracer
#Tracer()()

import os, sys, time

### prevent the Jupyter notebook from dying under heavy Keras output (see the rerun-safe sketch after the training cell below)
stdout = sys.stdout
#sys.stdout = sys.__stdout__  # did not work to restore print -> console
#sys.stdout = open('keras_output.txt', 'a+')
#sys.stdout = stdout

import utils
import importlib
importlib.reload(utils)

# Allow relative imports from directories above the cwd
sys.path.insert(1, os.path.join(sys.path[0], '..'))

#import modules
from utils import *

%matplotlib inline

np.random.seed(42)

from sklearn.preprocessing import MinMaxScaler
from sklearn.metrics import mean_squared_error

%pwd  #Verify we are in the right directory
!uname -a


Using TensorFlow backend.
Out[1]:
<module 'utils' from '/home/tw/dev/py/module/twBase/utils.py'>
Out[1]:
'/home/tw/kg/rain'
Linux sysid 4.8.0-34-generic #36-Ubuntu SMP Wed Dec 21 17:24:18 UTC 2016 x86_64 x86_64 x86_64 GNU/Linux

In [15]:
#Create references to important directories we will use over and over
current_dir = os.getcwd()
dataname = 'rain-s'

sample = False
if sample:
    dpath = "./data/rain-s/"
else:
    dpath = "./data/rain/"

seq_len = 19

In [25]:
import twModel
importlib.reload(twModel)


Out[25]:
<module 'twModel' from '/home/tw/kg/rain/twModel.py'>

In [ ]:
from keras.models import load_model
model = load_model('xxx.h5')

In [9]:
#model = twModel.RNNModel()
model = twModel.BidiRNNModel()

In [ ]:


In [11]:
model.init_model(rnn_size=256,
                    dense_size=512,
                    #optimizer='Adam',
                    init='uniform',
                    activation='relu',
                    layers=[False, False],
                    dropout_rate=0)


____________________________________________________________________________________________________
Layer (type)                     Output Shape          Param #     Connected to                     
====================================================================================================
input_2 (InputLayer)             (None, 19, 22)        0                                            
____________________________________________________________________________________________________
timedistributed_8 (TimeDistribute(None, 19, 512)       11776       input_2[0][0]                    
____________________________________________________________________________________________________
simplernn_5 (SimpleRNN)          (None, 19, 256)       196864      timedistributed_8[0][0]          
____________________________________________________________________________________________________
simplernn_7 (SimpleRNN)          (None, 19, 256)       196864      timedistributed_8[0][0]          
____________________________________________________________________________________________________
timedistributed_9 (TimeDistribute(None, 19, 512)       131584      simplernn_5[0][0]                
____________________________________________________________________________________________________
timedistributed_11 (TimeDistribut(None, 19, 512)       131584      simplernn_7[0][0]                
____________________________________________________________________________________________________
simplernn_6 (SimpleRNN)          (None, 19, 256)       196864      timedistributed_9[0][0]          
____________________________________________________________________________________________________
simplernn_8 (SimpleRNN)          (None, 19, 256)       196864      timedistributed_11[0][0]         
____________________________________________________________________________________________________
timedistributed_10 (TimeDistribut(None, 19, 512)       131584      simplernn_6[0][0]                
____________________________________________________________________________________________________
timedistributed_12 (TimeDistribut(None, 19, 512)       131584      simplernn_8[0][0]                
____________________________________________________________________________________________________
merge_2 (Merge)                  (None, 19, 1024)      0           timedistributed_10[0][0]         
                                                                   timedistributed_12[0][0]         
____________________________________________________________________________________________________
timedistributed_13 (TimeDistribut(None, 19, 512)       524800      merge_2[0][0]                    
____________________________________________________________________________________________________
timedistributed_14 (TimeDistribut(None, 19, 1)         513         timedistributed_13[0][0]         
____________________________________________________________________________________________________
lambda_2 (Lambda)                (None, 1)             0           timedistributed_14[0][0]         
====================================================================================================
Total params: 1850881
____________________________________________________________________________________________________
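
The summary corresponds to a bidirectional SimpleRNN stack: a shared per-timestep Dense embedding feeds a forward and a backward branch of two SimpleRNN layers (each followed by a TimeDistributed Dense), the branches are concatenated, projected back to one value per timestep, and a final Lambda sums the 19 per-timestep values into the hourly total. twModel.py is not listed in this notebook, so the cell below is only a sketch of what init_model presumably builds with the Keras 1.x functional API; the layer sizes match the parameter counts above, but the function name and the go_backwards handling are assumptions.

In [ ]:
from keras.layers import Input, Dense, SimpleRNN, TimeDistributed, Lambda, merge
from keras.models import Model
from keras import backend as K

def build_bidi_rnn(seq_len=19, n_features=22, rnn_size=256, dense_size=512):
    """Hypothetical reconstruction of BidiRNNModel.init_model -- an assumption, not the actual twModel code."""
    inputs = Input(shape=(seq_len, n_features))
    # shared per-timestep embedding (11776 params = 22*512 + 512)
    embed = TimeDistributed(Dense(dense_size, activation='relu'))(inputs)

    def branch(h, go_backwards):
        # two stacked SimpleRNNs, each followed by a per-timestep Dense
        h = SimpleRNN(rnn_size, activation='relu', return_sequences=True, go_backwards=go_backwards)(h)
        h = TimeDistributed(Dense(dense_size, activation='relu'))(h)
        h = SimpleRNN(rnn_size, activation='relu', return_sequences=True, go_backwards=go_backwards)(h)
        return TimeDistributed(Dense(dense_size, activation='relu'))(h)

    fwd = branch(embed, go_backwards=False)
    # NOTE: go_backwards alone leaves the backward branch in reversed time order;
    # the summed output below is unaffected, but the real twModel may handle this differently.
    bwd = branch(embed, go_backwards=True)

    merged = merge([fwd, bwd], mode='concat', concat_axis=-1)          # (None, 19, 1024)
    h = TimeDistributed(Dense(dense_size, activation='relu'))(merged)  # 524800 params
    per_step = TimeDistributed(Dense(1))(h)                            # one rain-rate value per timestep
    preds = Lambda(lambda t: K.sum(t, axis=1), output_shape=(1,))(per_step)  # sum over the 19 steps

    model = Model(input=inputs, output=preds)
    model.compile(optimizer='rmsprop', loss='mse')
    return model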

In [13]:
from IPython.display import SVG
from keras.utils.visualize_util import model_to_dot

SVG(model_to_dot(model.model).create(prog='dot', format='svg'))


Out[13]:
[SVG model graph: input_2 → timedistributed_8 (Dense) → two branches {simplernn_5 → timedistributed_9 → simplernn_6 → timedistributed_10} and {simplernn_7 → timedistributed_11 → simplernn_8 → timedistributed_12} → merge_2 → timedistributed_13 → timedistributed_14 → lambda_2]

In [52]:
X_train, y_train, X_valid, y_valid = twModel.data(sample)
X_train.shape, y_train.shape, X_valid.shape, y_valid.shape


Out[52]:
((643349, 19, 22), (643349,), (73165, 19, 22), (73165,))

In [53]:
%%time
#%%capture output
sys.stdout = open('keras_output.txt', 'a+')
m_, hist = model.train(X_train, y_train, epochs=35, batch_size=128, verbose=1, validation_data=(X_valid, y_valid))
sys.stdout = stdout
hist

model.save()
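
The sys.stdout redirect above keeps the per-batch progress output out of the browser (very long fit() logs are what makes the notebook "die"), but it leaves stdout pointed at the file if the cell errors out. A rerun-safe variant of the same idea is a small context manager; this is just a sketch, not part of twModel:

In [ ]:
import sys
from contextlib import contextmanager

@contextmanager
def stdout_to_file(path):
    """Temporarily send print/progress output to a file; always restore sys.stdout."""
    saved = sys.stdout
    with open(path, 'a+') as f:
        sys.stdout = f
        try:
            yield
        finally:
            sys.stdout = saved

# usage (hypothetical):
# with stdout_to_file('keras_output.txt'):
#     m_, hist = model.train(X_train, y_train, epochs=35, batch_size=128,
#                            verbose=1, validation_data=(X_valid, y_valid))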

In [ ]:


In [26]:
#model = twModel.RNNModel()
model = twModel.BidiRNNModel()
model.load()


model loaded from:  BidiRNNModel.h5

In [27]:
model.model.summary()


____________________________________________________________________________________________________
Layer (type)                     Output Shape          Param #     Connected to                     
====================================================================================================
input_2 (InputLayer)             (None, 19, 22)        0                                            
____________________________________________________________________________________________________
timedistributed_8 (TimeDistribute(None, 19, 512)       11776       input_2[0][0]                    
____________________________________________________________________________________________________
simplernn_5 (SimpleRNN)          (None, 19, 256)       196864      timedistributed_8[0][0]          
____________________________________________________________________________________________________
simplernn_7 (SimpleRNN)          (None, 19, 256)       196864      timedistributed_8[0][0]          
____________________________________________________________________________________________________
timedistributed_9 (TimeDistribute(None, 19, 512)       131584      simplernn_5[0][0]                
____________________________________________________________________________________________________
timedistributed_11 (TimeDistribut(None, 19, 512)       131584      simplernn_7[0][0]                
____________________________________________________________________________________________________
simplernn_6 (SimpleRNN)          (None, 19, 256)       196864      timedistributed_9[0][0]          
____________________________________________________________________________________________________
simplernn_8 (SimpleRNN)          (None, 19, 256)       196864      timedistributed_11[0][0]         
____________________________________________________________________________________________________
timedistributed_10 (TimeDistribut(None, 19, 512)       131584      simplernn_6[0][0]                
____________________________________________________________________________________________________
timedistributed_12 (TimeDistribut(None, 19, 512)       131584      simplernn_8[0][0]                
____________________________________________________________________________________________________
merge_2 (Merge)                  (None, 19, 1024)      0           timedistributed_10[0][0]         
                                                                   timedistributed_12[0][0]         
____________________________________________________________________________________________________
timedistributed_13 (TimeDistribut(None, 19, 512)       524800      merge_2[0][0]                    
____________________________________________________________________________________________________
timedistributed_14 (TimeDistribut(None, 19, 1)         513         timedistributed_13[0][0]         
____________________________________________________________________________________________________
lambda_2 (Lambda)                (None, 1)             0           timedistributed_14[0][0]         
====================================================================================================
Total params: 1850881
____________________________________________________________________________________________________

In [28]:
X_test = twModel.data_test()
X_test.shape


Out[28]:
(717625, 19, 22)

In [39]:
X_test[:3,0,0]
X_test[:,0,0].max()


Out[39]:
array([ 1.,  0.,  3.])
Out[39]:
58.0

In [29]:
%%time
preds = model.model.predict(X_test, batch_size=128, verbose=2)

In [48]:
ids = np.load('test/obs_ids_test.npy')
ids.shape


Out[48]:
(717625,)

In [49]:
df = pd.DataFrame(data=preds, index=ids[:], columns=['Expected'])

In [50]:
df.info()
df.to_csv('df.csv', index_label='Id')


<class 'pandas.core.frame.DataFrame'>
Int64Index: 717625 entries, 1 to 717625
Data columns (total 1 columns):
Expected    717625 non-null float32
dtypes: float32(1)
memory usage: 8.2 MB

Data ^


In [ ]:
%mkdir -p $dpath

In [ ]:
# run everything on a small subset of the data
# (train.csv has 13,765,202 lines; keep the first 1M train / 800k test rows)
!head -n 1000000 ./data/rain/train.csv > ./data/rain-s/train.csv
!head -n 800000 ./data/rain/test.csv > ./data/rain-s/test.csv

In [ ]:
# manual download, the kg CLI did not work
!python data_preprocessing.py

In [ ]:
obs_ids_train = np.load('train/obs_ids_train_cv0.npy')
train = np.load(dpath+'processed_train.npy')

In [ ]:
train.shape, obs_ids_train.shape
train[0]
obs_ids_train[0]

In [ ]:
COLUMNS = ['Id','minutes_past', 'radardist_km', 'Ref', 'Ref_5x5_10th',
       'Ref_5x5_50th', 'Ref_5x5_90th', 'RefComposite',
       'RefComposite_5x5_10th', 'RefComposite_5x5_50th',
       'RefComposite_5x5_90th', 'RhoHV', 'RhoHV_5x5_10th',
       'RhoHV_5x5_50th', 'RhoHV_5x5_90th', 'Zdr', 'Zdr_5x5_10th',
       'Zdr_5x5_50th', 'Zdr_5x5_90th', 'Kdp', 'Kdp_5x5_10th',
       'Kdp_5x5_50th', 'Kdp_5x5_90th', 'Expected']

data_pd = pd.DataFrame(data=train[:,0:], columns=COLUMNS)
data_pd.info()
data_pd.head(2)

In [ ]:
data_pd.groupby('Id').count().head(3)
data_pd.groupby('Id').mean().head(3)

In [ ]:
# generate sequence data
!python data_augmentation_train.py

In [ ]:
# generate sequence data
!python data_augmentation_valid.py

Correlation

Load Data


In [ ]:
X_train = np.load('train/data_train_augmented_cv0_t19_rand0.npy')
y_train = np.load('train/data_train_expected_cv0.npy')
X_train.shape, y_train.shape
X_train[0, 0], y_train[0]

In [45]:
ids = np.load('valid/obs_ids_valid_cv0-s.npy')
X_valid = np.load('valid/data_valid_augmented_cv0_t19_rand0-s.npy')
y_valid = np.load('valid/data_valid_expected_cv0-s.npy')
X_valid.shape, y_valid.shape
X_valid[0, 0], y_valid[0]


Out[45]:
((5268, 19, 22), (5268,))
Out[45]:
(array([  0. ,  16. ,  15.5,   0. ,   0. ,  22.5,  15.5,   0. ,  15. ,  22.5,   0. ,   0. ,   0. ,
          0. ,   0. ,   0. ,   0. ,   0. ,   0. ,   0. ,   0. ,   0. ]),
 3.8100019999999999)

In [46]:
ids.shape


Out[46]:
(5268,)

In [ ]:
plot2(X_train[0], y_train)

Model ^

Abstract Model


In [ ]:
class AbstractModel():
    
    def __init__(self):
        self.modelPath = dpath+self.get_classname()+'.h5'
        self.checkpoint = ModelCheckpoint(filepath= dpath + 'checkpoint-{epoch:02d}-{loss:.3f}-{val_loss:.3f}.hdf5')
        
    @classmethod  #classmethod always gets class as parameter
    def get_classname(cls):
        return cls.__name__
    
    def save(self):
        self.model.save(self.modelPath)
        print("model saved to: ", self.modelPath)
        
    def load(self):
        self.model = load_model(self.modelPath)
        print("model loaded from: ", self.modelPath)
        
    def train(self, X_train, y_train, epochs=1, batch_size=64, val_split=0.05, verbose=1):
        global_start_time = time.time()
        try:
            history = self.model.fit(
                X_train, y_train,
                batch_size=batch_size,
                nb_epoch=epochs,
                validation_split=val_split,
                verbose=verbose,
                #callbacks=[self.checkpoint, self.csvLogger])  #BUG: csv logger not rerun capable
                callbacks=[self.checkpoint])
        except KeyboardInterrupt:
            print('Training duration (s) : ', time.time() - global_start_time)
            return self.model, None  # fit was interrupted, no History object available

        print('Training duration (s) : ', time.time() - global_start_time)
        return self.model, history

Model Functional

Dense


In [ ]:
class BaselineModel(AbstractModel):
    
    def __init__(self):
        super(BaselineModel, self).__init__()
        self.model = None
        
    def __call__(self, neurons=12, optimizer='RMSprop', tw_init='uniform', activation='relu', dropout_rate=0, weight_constraint=2, layers=[False, False]):
        """ returns the model, e.g. for GridSearch"""
        self.model = None  # make sure, that instance is pickable
        return self.create_model(neurons, optimizer, tw_init, activation, dropout_rate, weight_constraint, layers)

    def init_model(self, neurons=12, optimizer='RMSprop', tw_init='uniform', activation='relu', dropout_rate=0, weight_constraint=2, layers=[False, False]):
        self.model = self.create_model(neurons, optimizer, tw_init, activation, dropout_rate, weight_constraint, layers)
        self.model.summary()

    def create_model(self, neurons=12, optimizer='RMSprop', tw_init='uniform', activation='relu', dropout_rate=0, weight_constraint=2, layers=[False, False]):
        ''' creates functional KERAS model
        parameters are passed from GridSearch, always provide default to call the model without GridSearch
        '''
        inputs = Input(shape=(40,))

        x = Dense(neurons, init=tw_init, activation=activation, W_constraint=maxnorm(weight_constraint))(inputs)
        x = Dropout(dropout_rate)(x)
        if layers[0]:
            x = Dense(neurons, init=tw_init, activation=activation, W_constraint=maxnorm(weight_constraint))(x)
            x = Dropout(dropout_rate)(x)
        if layers[1]:
            x = Dense(neurons, init=tw_init, activation=activation, W_constraint=maxnorm(weight_constraint))(x)
            x = Dropout(dropout_rate)(x)

        preds = Dense(1, activation='linear')(x)

        model = Model(input=inputs, output=preds)
        model.compile(optimizer=optimizer, loss='mse', metrics=['mse'])

        return model
        
        
m = BaselineModel()
m.modelPath
m.init_model(neurons=12, layers=[False, False])  # init_model also prints the summary

In [ ]:
class DenseModel(AbstractModel):
    """take the seq_len as feature input and predict one output"""
    
    classtype = 'dense'  # class variable
    
    def __init__(self, layers):
        super(DenseModel, self).__init__()
        self.create(layers)

    def create(self, layers):
        if verbose: print('> Create Model', self.get_classname(), ' type: ', self.classtype)
        start = time.time()
        
        inputs = Input(shape=(layers[0],))
        
        x = Dense(layers[1], activation='relu')(inputs)
        x = Dropout(0.25)(x)
        x = Dense(layers[2], activation='relu')(x)
        x = Dropout(0.25)(x)
        preds = Dense(layers[3], activation='linear')(x)
        
        self.model = Model(input=inputs, output=preds)
        
        self.model.compile(optimizer='adam', loss='mse', metrics=['mse', 'mape'])
        if verbose: print("Compilation Time : ", time.time() - start)
        
        
m = DenseModel([seq_len, 500, 250, 1])  #bias added
m.model.summary()

In [ ]:
%%time
#%%capture output
#sys.stdout = open('keras_output.txt', 'a+')
#m.compile()
model, hist = m.train(X_train, y_train, epochs=1, verbose=1)
#sys.stdout = stdout
hist

#m.save()

LSTM


In [ ]:
class BaseLTSM(AbstractModel):
    
    classtype = 'ltsm'  # class variable
    classname = 'BaseLTSM'
    
    def __init__(self, layers):
        super(BaseLTSM, self).__init__()
        self.create(layers)

    def create(self, layers):
        print('> Create Model', self.get_classname(), ' type: ', self.classtype)
        start = time.time()
        
        inputs = Input(shape=(seq_len, layers[0]))
        
        x = LSTM(layers[1], activation='relu', return_sequences=True)(inputs)
        #x = Dropout(0.1)(x)
        x = LSTM(layers[2], activation='relu', return_sequences=False)(x)
        #x = Dropout(0.1)(x)
        preds = Dense(layers[3], activation='linear')(x)
        
        self.model = Model(input=inputs, output=preds)
        self.model.compile(optimizer='rmsprop', loss='mse', metrics=['mse'])
        print("Compilation Time : ", time.time() - start)
        
#m = BaseLTSM([1, seq_len+1, (seq_len+1)*2, 1])  #bias added
m = BaseLTSM([1, 50, 50, 1])  #bias added
m.modelPath
m.model.summary()

Training ^


In [ ]:
%%time
%%capture output
#sys.stdout = open('keras_output.txt', 'a+')
#m.compile()
model, hist = m.train(X_train, y_train, epochs=1, verbose=1)
#sys.stdout = stdout
hist

#m.save()

In [ ]:
output.show()

In [ ]:
from keras.models import load_model
# returns a compiled model
# identical to the previous one
model = load_model(h5PathModel)

In [ ]:
from sklearn.model_selection import GridSearchCV
from keras.wrappers.scikit_learn import KerasClassifier, KerasRegressor

def _model():
    return m.model
model = KerasRegressor(build_fn=_model, verbose=1)
# alternatively pass the instance itself; KerasRegressor then uses m.__call__() to build the model
#model = KerasRegressor(build_fn=m, verbose=1)

In [ ]:
%%capture output
grid = GridSearchCV(model,
                         param_grid={'nb_epoch': [1],
                                     'batch_size': [10]},
                         #scoring='mse',
                         scoring='neg_mean_squared_error',
                         n_jobs=1)
grid_result = grid.fit(X_train, y_train)

In [ ]:
output.show()

In [ ]:
# summarize results
# The unified scoring API always maximizes the score, so scores which need to be minimized are negated in order for the unified scoring API to work correctly. The score that is returned is therefore negated when it is a score that should be minimized and left positive if it is a score that should be maximized.
print("Best: %f using %s" % (grid_result.best_score_, grid_result.best_params_))
means = grid_result.cv_results_['mean_test_score']
stds = grid_result.cv_results_['std_test_score']
params = grid_result.cv_results_['params']
for mean, stdev, param in zip(means, stds, params):
    print("%f (%f) with: %r" % (mean, stdev, param))

In [ ]:
# validator.best_estimator_ returns sklearn-wrapped version of best model.
# validator.best_estimator_.model returns the (unwrapped) keras model
best_model = grid.best_estimator_.model
metric_names = best_model.metrics_names
metric_values = best_model.evaluate(X_test, y_test)
for metric, value in zip(metric_names, metric_values):
    print(metric, ': ', value)

In [ ]:
grid_result.best_score_
grid_result.best_params_
grid_result.cv_results_

Predictions ^


In [ ]:
seq_len, X_test.shape, y_test.shape
X_test[0, :10], y_test[0]
X_test[1, :10], y_test[1]

In [ ]:
def predict_sequence_full(model, data, window_size):
    #Shift the window by 1 new prediction each time, re-run predictions on new window
    curr_frame = data[0]
    predicted = []
    
    # loop over entire testdata
    for i in range(len(data)):
        if m.classtype == 'ltsm':
            predicted.append(model.predict(curr_frame[np.newaxis,:,:])[0,0])  #get element from shape(1,1,:)
        elif m.classtype == 'dense':
            predicted.append(model.predict(curr_frame[np.newaxis,:])[0][0])  #get element from shape(1,1)
        else:
            raise ValueError('Wrong model type: ', m.classtype)
            
        curr_frame = curr_frame[1:]  #move window
        #Tracer()()
        curr_frame = np.insert(curr_frame, [window_size-2], predicted[-1], axis=0)  #fill frame with prediction
    return predicted

In [ ]:
%%time
length = len(X_test)
if m.classtype == 'ltsm':
    predicted = predict_sequence_full(model, X_test[:length], seq_len)
elif m.classtype == 'dense':
    predicted = predict_sequence_full(model, np.squeeze(X_test[:length]), seq_len)
else:
    raise ValueError('Wrong model type: ', m.classtype)
#predicted = predict_sequence_full(model, np.squeeze(X_test[:length]), seq_len)
print(len(predicted), predicted)
plot_result(y_test, predicted, length)

In [ ]:
y_test.shape
y_test
np.array(predicted)

In [ ]:
def evaluate(X, y, verbose=0):
    # gives the metrics, defined during compile
    for n in zip(model.metrics_names, model.evaluate(X, y, verbose=verbose)):
        print("{}:\t{}".format(n[0], n[1]))
evaluate(X_test, y_test, 1)

In [ ]: