notebook.community

Edit and run



In [2]:

    
from new_SiameseNet import *
%matplotlib inline
import matplotlib.pyplot as plt









    



Using Theano backend.
/Users/wilbury/anaconda/lib/python2.7/site-packages/theano/tensor/signal/downsample.py:5: UserWarning: downsample module has been moved to the pool module.
  warnings.warn("downsample module has been moved to the pool module.")



In [3]:

    
# Prepare data
print 'Getting CIFAR10 data...'

'''
data = get_CIFAR10_data()

x_train, y_train = data['X_train'], data['y_train']
x_val,   y_val   = data['X_val'],   data['y_val']
'''

(x_train, y_train), (x_val, y_val) = cifar10.load_data()

x_train = x_train.astype('float32')
x_val = x_val.astype('float32')

y_train = y_train.reshape((y_train.shape[0],))
y_val = y_val.reshape((y_val.shape[0],))

N = x_train.shape[0]









    



Getting CIFAR10 data...



In [3]:

    
# Specify structure of Siamese part of SiameseNet
# This part needs to be improved. I'm kind of just using random layers.
init = 'glorot_uniform'
in_shp = (3,32,32)
seq = Sequential()
seq.add(BatchNormalization(epsilon=1e-7,
                            mode=0,
                            axis=1,
                            momentum=0.9,
                            weights=None,
                            input_shape=in_shp))
#seq.add(Flatten())
#seq.add(Dense(128, activation='relu'))
#seq.add(Dropout(0.1))
#seq.add(Dense(128, activation='relu'))
#seq.add(Dropout(0.1))
for _ in range(2):
    seq.add(Convolution2D(3, 3, 3, init=init, border_mode='same'))
    seq.add(Activation('relu'))
    seq.add(Dropout(.1))
#seq.add(Dense(128, activation='relu'))
seq.add(Flatten())
seq.add(Dense(128))
layers = seq

sn = SiameseNet(layers, input_shape=(3, 32, 32), verbose=False)
sn.compile()



In [4]:

    
def _train_sn(sn, x_train, y_train, x_val, y_val, filepath):
    d_val = invert_dataset(x_val,  y_val)
    d_train = invert_dataset(x_train,  y_train)
    num_ep = 10
    history = sn.fit(*generate_data(x_train, d_train), 
            validation_data=generate_data(x_val, d_val),
            nb_epoch=num_ep)
    return history

history = _train_sn(sn, x_train, y_train, x_val, y_val, filepath='weights.h5')









    



Train on 97600 samples, validate on 1540 samples
Epoch 1/10
97600/97600 [==============================] - 66s - loss: 0.3157 - val_loss: 0.2359
Epoch 2/10
97600/97600 [==============================] - 65s - loss: 0.2389 - val_loss: 0.2316
Epoch 3/10
97600/97600 [==============================] - 65s - loss: 0.2291 - val_loss: 0.2361
Epoch 4/10
97600/97600 [==============================] - 65s - loss: 0.2227 - val_loss: 0.2250
Epoch 5/10
97600/97600 [==============================] - 65s - loss: 0.2179 - val_loss: 0.2327
Epoch 6/10
97600/97600 [==============================] - 65s - loss: 0.2140 - val_loss: 0.2193
Epoch 7/10
97600/97600 [==============================] - 65s - loss: 0.2105 - val_loss: 0.2187
Epoch 8/10
97600/97600 [==============================] - 65s - loss: 0.2074 - val_loss: 0.2185
Epoch 9/10
97600/97600 [==============================] - 65s - loss: 0.2046 - val_loss: 0.2372
Epoch 10/10
97600/97600 [==============================] - 65s - loss: 0.2027 - val_loss: 0.2208



In [5]:

    
#loss = sn.evaluate(*generate_data(d_val, examples_per_image=5))
d_val = invert_dataset(x_val,  y_val)
val_x_dat, val_y_dat = generate_data(x_val, d_val)
prediction = sn.predict(val_x_dat)[SiameseNet.OUTPUT]

ret_preds = prediction
max_d = np.max(ret_preds)
min_d = np.min(ret_preds)

print max_d
print min_d

#thresh = (max_d + min_d) / 2.0
#preds = [0,0]
#for i,p in enumerate(prediction):
#    if ret_preds[i] > thresh:
#        preds[1] += 1
#    else:
#        preds[0] += 1
#print preds









    



1.26899111271
0.120806694031



In [6]:

    
#print history.history
l = history.history['loss']
val_l = history.history['val_loss']



In [ ]:



In [ ]:



In [7]:

    
plt.figure()
plt.plot(range(1,len(l)+1), l, label='Training Loss')
plt.title('Siamese Network Training/Validation Loss vs. Epochs')
plt.plot(range(1,len(val_l)+1), val_l, label='Validation Loss')
plt.xlabel('Epochs')
plt.ylabel('Loss')
plt.legend()
#plt.savefig('siam_loss3.png')









    Out[7]:





<matplotlib.legend.Legend at 0x7f45491f0a50>



In [8]:

    
def similarity(sn, x1, x2):
    x = [np.array([x1]), np.array([x2])]
    prediction = sn.predict(x, batch_size=1)
    return prediction['output'][0][0]



In [9]:

    
similarity(sn, x_train[0], x_train[1])









    Out[9]:





0.91613972187042236



In [10]:

    
num_zeros = 4913
num_ones = 9794 - 4913
num_examples = 80
sorted_index = np.argsort(y_train)[:num_zeros + num_ones]
chosen_zeros = sorted_index[random.sample(xrange(num_zeros), num_examples)]
chosen_ones = sorted_index[random.sample(xrange(num_zeros, num_zeros + num_ones), num_examples)]
indices = np.hstack((chosen_zeros, chosen_ones))
sorted_y_train = y_train[indices]
sorted_x_train = x_train[indices]



In [11]:

    
num_tests = len(indices)
similarity_matrix = np.zeros((num_tests, num_tests))
for i in xrange(num_tests):
    for j in xrange(num_tests):
        similarity_matrix[i][j] = similarity(sn, sorted_x_train[i], sorted_x_train[j])



In [17]:

    
%matplotlib inline
import matplotlib.pyplot as plt
import matplotlib



In [18]:

    
fig, ax = plt.subplots()
fig.set_size_inches(10, 10)
ax.pcolor(similarity_matrix, cmap=matplotlib.cm.Blues)
ax.set_xticks(np.arange(similarity_matrix.shape[0])+0.5, minor=False)
ax.set_yticks(np.arange(similarity_matrix.shape[1])+0.5, minor=False)
ax.set_xticklabels(sorted_y_train, minor=False)
ax.set_yticklabels(sorted_y_train, minor=False)
#plt.savefig('similarity_matrix_80_examples_5.png')









    Out[18]:





[<matplotlib.text.Text at 0x7f454a54bc90>,
 <matplotlib.text.Text at 0x7f454a53ed10>,
 <matplotlib.text.Text at 0x7f4549754790>,
 <matplotlib.text.Text at 0x7f4549754c90>,
 <matplotlib.text.Text at 0x7f454969f1d0>,
 <matplotlib.text.Text at 0x7f454969f6d0>,
 <matplotlib.text.Text at 0x7f454969fbd0>,
 <matplotlib.text.Text at 0x7f45496a9110>,
 <matplotlib.text.Text at 0x7f45496a9610>,
 <matplotlib.text.Text at 0x7f45496a9b10>,
 <matplotlib.text.Text at 0x7f45496b3050>,
 <matplotlib.text.Text at 0x7f45496b3550>,
 <matplotlib.text.Text at 0x7f45496b3a50>,
 <matplotlib.text.Text at 0x7f45496b3f50>,
 <matplotlib.text.Text at 0x7f45496be490>,
 <matplotlib.text.Text at 0x7f45496be990>,
 <matplotlib.text.Text at 0x7f45496bee90>,
 <matplotlib.text.Text at 0x7f45496c83d0>,
 <matplotlib.text.Text at 0x7f45496c88d0>,
 <matplotlib.text.Text at 0x7f45496c8dd0>,
 <matplotlib.text.Text at 0x7f45496d3390>,
 <matplotlib.text.Text at 0x7f45496d3ad0>,
 <matplotlib.text.Text at 0x7f45496db250>,
 <matplotlib.text.Text at 0x7f45496db990>,
 <matplotlib.text.Text at 0x7f4549663110>,
 <matplotlib.text.Text at 0x7f4549663850>,
 <matplotlib.text.Text at 0x7f4549663f90>,
 <matplotlib.text.Text at 0x7f454966b710>,
 <matplotlib.text.Text at 0x7f454966be50>,
 <matplotlib.text.Text at 0x7f45496f4850>,
 <matplotlib.text.Text at 0x7f45496eb410>,
 <matplotlib.text.Text at 0x7f4549757d90>,
 <matplotlib.text.Text at 0x7f454974e710>,
 <matplotlib.text.Text at 0x7f45497445d0>,
 <matplotlib.text.Text at 0x7f4549730f50>,
 <matplotlib.text.Text at 0x7f4549728b90>,
 <matplotlib.text.Text at 0x7f454971e510>,
 <matplotlib.text.Text at 0x7f4549789fd0>,
 <matplotlib.text.Text at 0x7f4549780a50>,
 <matplotlib.text.Text at 0x7f45497763d0>,
 <matplotlib.text.Text at 0x7f454976d290>,
 <matplotlib.text.Text at 0x7f45497dac10>,
 <matplotlib.text.Text at 0x7f45497d0850>,
 <matplotlib.text.Text at 0x7f45497c61d0>,
 <matplotlib.text.Text at 0x7f45497b2d50>,
 <matplotlib.text.Text at 0x7f4549679290>,
 <matplotlib.text.Text at 0x7f45496799d0>,
 <matplotlib.text.Text at 0x7f4549681150>,
 <matplotlib.text.Text at 0x7f4549681890>,
 <matplotlib.text.Text at 0x7f4549681fd0>,
 <matplotlib.text.Text at 0x7f4549689750>,
 <matplotlib.text.Text at 0x7f4549689e90>,
 <matplotlib.text.Text at 0x7f4549693610>,
 <matplotlib.text.Text at 0x7f4549693d50>,
 <matplotlib.text.Text at 0x7f454969c4d0>,
 <matplotlib.text.Text at 0x7f454969cc10>,
 <matplotlib.text.Text at 0x7f4549624390>,
 <matplotlib.text.Text at 0x7f4549624ad0>,
 <matplotlib.text.Text at 0x7f454962f250>,
 <matplotlib.text.Text at 0x7f454962f990>,
 <matplotlib.text.Text at 0x7f4549638110>,
 <matplotlib.text.Text at 0x7f4549638850>,
 <matplotlib.text.Text at 0x7f4549638f90>,
 <matplotlib.text.Text at 0x7f4549641710>,
 <matplotlib.text.Text at 0x7f4549641e50>,
 <matplotlib.text.Text at 0x7f454964a5d0>,
 <matplotlib.text.Text at 0x7f454964ad10>,
 <matplotlib.text.Text at 0x7f4549654490>,
 <matplotlib.text.Text at 0x7f4549654bd0>,
 <matplotlib.text.Text at 0x7f45495df350>,
 <matplotlib.text.Text at 0x7f45495dfa90>,
 <matplotlib.text.Text at 0x7f45495ea210>,
 <matplotlib.text.Text at 0x7f45495ea950>,
 <matplotlib.text.Text at 0x7f45495f30d0>,
 <matplotlib.text.Text at 0x7f45495f3810>,
 <matplotlib.text.Text at 0x7f45495f3f50>,
 <matplotlib.text.Text at 0x7f45495fd6d0>,
 <matplotlib.text.Text at 0x7f45495fde10>,
 <matplotlib.text.Text at 0x7f4549608590>,
 <matplotlib.text.Text at 0x7f4549608cd0>,
 <matplotlib.text.Text at 0x7f4549611450>,
 <matplotlib.text.Text at 0x7f4549611b90>,
 <matplotlib.text.Text at 0x7f454961b310>,
 <matplotlib.text.Text at 0x7f454961ba50>,
 <matplotlib.text.Text at 0x7f45495a61d0>,
 <matplotlib.text.Text at 0x7f45495a6910>,
 <matplotlib.text.Text at 0x7f45495af090>,
 <matplotlib.text.Text at 0x7f45495af7d0>,
 <matplotlib.text.Text at 0x7f45495aff10>,
 <matplotlib.text.Text at 0x7f45495ba690>,
 <matplotlib.text.Text at 0x7f45495badd0>,
 <matplotlib.text.Text at 0x7f45495c5550>,
 <matplotlib.text.Text at 0x7f45495c5c90>,
 <matplotlib.text.Text at 0x7f45495ce410>,
 <matplotlib.text.Text at 0x7f45495ceb50>,
 <matplotlib.text.Text at 0x7f45495d92d0>,
 <matplotlib.text.Text at 0x7f45495d9a10>,
 <matplotlib.text.Text at 0x7f4549563190>,
 <matplotlib.text.Text at 0x7f45495638d0>,
 <matplotlib.text.Text at 0x7f454956e050>,
 <matplotlib.text.Text at 0x7f454956e790>,
 <matplotlib.text.Text at 0x7f454956eed0>,
 <matplotlib.text.Text at 0x7f4549578650>,
 <matplotlib.text.Text at 0x7f4549578d90>,
 <matplotlib.text.Text at 0x7f4549582510>,
 <matplotlib.text.Text at 0x7f4549582c50>,
 <matplotlib.text.Text at 0x7f454958c3d0>,
 <matplotlib.text.Text at 0x7f454958cb10>,
 <matplotlib.text.Text at 0x7f4549594290>,
 <matplotlib.text.Text at 0x7f45495949d0>,
 <matplotlib.text.Text at 0x7f4549521150>,
 <matplotlib.text.Text at 0x7f4549521890>,
 <matplotlib.text.Text at 0x7f4549521fd0>,
 <matplotlib.text.Text at 0x7f454952b750>,
 <matplotlib.text.Text at 0x7f454952be90>,
 <matplotlib.text.Text at 0x7f4549535610>,
 <matplotlib.text.Text at 0x7f4549535d50>,
 <matplotlib.text.Text at 0x7f45495404d0>,
 <matplotlib.text.Text at 0x7f4549540c10>,
 <matplotlib.text.Text at 0x7f454954a390>,
 <matplotlib.text.Text at 0x7f454954aad0>,
 <matplotlib.text.Text at 0x7f4549555250>,
 <matplotlib.text.Text at 0x7f4549555990>,
 <matplotlib.text.Text at 0x7f45494df110>,
 <matplotlib.text.Text at 0x7f45494df850>,
 <matplotlib.text.Text at 0x7f45494dff90>,
 <matplotlib.text.Text at 0x7f45494e8710>,
 <matplotlib.text.Text at 0x7f45494e8e50>,
 <matplotlib.text.Text at 0x7f45494f35d0>,
 <matplotlib.text.Text at 0x7f45494f3d10>,
 <matplotlib.text.Text at 0x7f45494fc490>,
 <matplotlib.text.Text at 0x7f45494fcbd0>,
 <matplotlib.text.Text at 0x7f4549509350>,
 <matplotlib.text.Text at 0x7f4549509a90>,
 <matplotlib.text.Text at 0x7f4549512210>,
 <matplotlib.text.Text at 0x7f4549512950>,
 <matplotlib.text.Text at 0x7f454951b0d0>,
 <matplotlib.text.Text at 0x7f454951b810>,
 <matplotlib.text.Text at 0x7f454951bf50>,
 <matplotlib.text.Text at 0x7f45494a86d0>,
 <matplotlib.text.Text at 0x7f45494a8e10>,
 <matplotlib.text.Text at 0x7f45494b0590>,
 <matplotlib.text.Text at 0x7f45494b0cd0>,
 <matplotlib.text.Text at 0x7f45494bb450>,
 <matplotlib.text.Text at 0x7f45494bbb90>,
 <matplotlib.text.Text at 0x7f45494c6310>,
 <matplotlib.text.Text at 0x7f45494c6a50>,
 <matplotlib.text.Text at 0x7f45494d01d0>,
 <matplotlib.text.Text at 0x7f45494d0910>,
 <matplotlib.text.Text at 0x7f45494d9090>,
 <matplotlib.text.Text at 0x7f45494d97d0>,
 <matplotlib.text.Text at 0x7f45494d9f10>,
 <matplotlib.text.Text at 0x7f4549465690>,
 <matplotlib.text.Text at 0x7f4549465dd0>,
 <matplotlib.text.Text at 0x7f454946f550>,
 <matplotlib.text.Text at 0x7f454946fc90>,
 <matplotlib.text.Text at 0x7f454947a410>,
 <matplotlib.text.Text at 0x7f454947ab50>,
 <matplotlib.text.Text at 0x7f45494832d0>,
 <matplotlib.text.Text at 0x7f4549483a10>]



In [19]:

    
print np.mean(similarity_matrix[0:10:1,0:10:1])
print np.mean(similarity_matrix[10:20:1,10:20:1])
print np.mean(similarity_matrix[0:10:1,10:20:1])
print np.mean(similarity_matrix[10:20:1,0:10:1])









    



0.368407767128
0.405735358527
0.425017428994
0.425017426759



In [4]:

    
class KNN:
    def train(self, x, y):
        self.x_train = x
        self.y_train = y
        self.l2_dist = None
        self.siam_dist = None
        
    def compute_l2_dist(self, x_test):
        num_test = x_test.shape[0]
        num_train = self.x_train.shape[0]
        dists = np.zeros((num_test, num_train))
        x_test = x_test.reshape(num_test, -1)
        x_train = self.x_train.reshape(num_train, -1)
        aat = x_test.dot(x_test.T)
        abt = x_test.dot(x_train.T)
        bbt = x_train.dot(x_train.T)
        a2 = np.diag(aat).reshape(1,-1).T
        b2 = np.diag(bbt).reshape(1,-1)
        dists = np.sqrt(a2 - 2*abt + b2)
        self.l2_dists = dists
        
    def compute_siam_dist(self, sn, x_test):
        # x_test should be an array of datapoints
        #print self.x_train.shape
        #print x_test.shape
        num_test = x_test.shape[0]
        num_train = self.x_train.shape[0]
        dists = np.zeros((num_test, num_train))
        predictions = []
        for i in range(num_test):
            cur_samp = x_test[i]
            cur_samp = np.expand_dims(cur_samp, 0)
            cur_im = np.vstack([cur_samp]*num_train)
            x = [cur_im, self.x_train]
            prediction = sn.predict(x, batch_size=num_train)['output'].flatten()
            dists[i,:] = prediction
        self.siam_dists = dists
    
    def predict_k(self, mode='l2', k=1):
        dists = None
        if mode == 'l2':
            dists = self.l2_dists
        else:
            dists = self.siam_dists
        num_test = dists.shape[0]
        predictions = []
        for i in range(num_test):
            k_pred_inds = None
            k_pred_inds = dists[i,:].argsort()[:k]
            k_pred_dists = dists[i,k_pred_inds]
            k_pred_classes = self.y_train[k_pred_inds]
            class_pred = np.argmax(np.bincount(k_pred_classes))
            predictions.append((k_pred_inds, k_pred_dists, k_pred_classes, class_pred))
        return predictions



In [15]:

    
knn = KNN()
knn.train(x_train[:10000], y_train[:10000])
knn.compute_l2_dist(x_val[:100])



In [16]:

    
k_acc = []
for k in range(1,50,1):
    print k
    preds = knn.predict_k(k=k)
    num_correct = 0.0
    correct_imgs = []
    incorrect_imgs = []
    for i,pred in enumerate(preds):
        inds, dists, classes, c_pred = pred
        if c_pred == y_val[i]:
            num_correct += 1
            correct_imgs.append((i,pred))
        else:
            incorrect_imgs.append((i,pred))

    acc = num_correct / len(preds)
    k_acc.append((acc, correct_imgs, incorrect_imgs))
    print acc



In [49]:

    
accs = []
for k in range(len(k_acc)):
    acc, _, _ = k_acc[k]
    accs.append(acc)
plt.plot(accs)
plt.title('L2 Distance K-Nearest Neighbors Validation Accuracy')
plt.ylabel('Validation Accuracy')
plt.xlabel('Choice of K')
plt.show()
plt.savefig('l2_knn_val_acc.png')









    












    





<matplotlib.figure.Figure at 0x1672d1390>



In [57]:

    
def displayable(x, i):
    return np.rollaxis(x[i,:],0,3).astype('uint8')

def display_top(n, acc, accs, save_filename, mode='correct'):
    print 'best k =', np.argmax(accs) + 1
    k = np.argmax(accs)
    f, axarr = plt.subplots(n, k + 3, figsize=(20, 6))
    acc, cor_ims, inc_ims = k_acc[k]
    trunc_cor_ims = cor_ims[:n]
    trunc_inc_ims = inc_ims[:n]
    for ind,im in enumerate(trunc_cor_ims if mode == 'correct' else trunc_inc_ims):
        i, pred = im
        inds, dists, classes, c_pred = pred
        im1 = displayable(x_val, i)
        axarr[ind, 0].imshow(im1)
        axarr[ind, 0].axis('off')
        axarr[ind, 1].axis('off')
        for j in xrange(k + 1):
            im2 = displayable(x_train, inds[j])
            axarr[ind, j + 2].imshow(im2)
            axarr[ind, j + 2].axis('off')
    plt.show()



In [61]:

    
display_top(5, k_acc, accs, save_filename='k_correct', mode='correct')









    



  File "<ipython-input-61-263f802075fe>", line 1
    display_top(5, k_acc, accs, save_filename='k_correct', mode='correct')1
                                                                          ^
SyntaxError: invalid syntax



In [59]:

    
print 'best k =', np.argmax(accs)
acc, cor_ims, inc_ims = k_acc[np.argmax(accs)]
confusion_matrix = np.zeros((10,10))
print len(cor_ims)
print len(inc_ims)
for ind, im in enumerate(cor_ims):
    i, pred = im
    inds, dists, classes, c_pred = pred
    confusion_matrix[c_pred, y_val[i]] += 1
    
for ind, im in enumerate(inc_ims):
    i, pred = im
    inds, dists, classes, c_pred = pred
    confusion_matrix[c_pred, y_val[i]] += 1
    
plt.matshow(confusion_matrix)
plt.colorbar()
plt.savefig('l2_knn_confusion_matrix.png')









    



best k = 11
38
62






    



/Users/wilbury/anaconda/lib/python2.7/site-packages/matplotlib/collections.py:590: FutureWarning: elementwise comparison failed; returning scalar instead, but in the future will perform elementwise comparison
  if self._edgecolors == str('face'):



In [19]:

    
s_knn = KNN()
s_knn.train(x_train[:10000], y_train[:10000])
s_knn.compute_siam_dist(sn,x_val[:100])









    



---------------------------------------------------------------------------
NameError                                 Traceback (most recent call last)
<ipython-input-19-29d84ea61a66> in <module>()
      1 s_knn = KNN()
      2 s_knn.train(x_train[:10000], y_train[:10000])
----> 3 s_knn.compute_siam_dist(sn,x_val[:100])

NameError: name 'sn' is not defined



In [33]:

    
siam_acc = []
for k in range(1,50,1):
    print k
    preds = s_knn.predict_k(mode='siam',k=k)
    num_correct = 0.0
    correct_imgs = []
    incorrect_imgs = []
    for i,pred in enumerate(preds):
        inds, dists, classes, c_pred = pred
        if c_pred == y_val[i]:
            num_correct += 1
            correct_imgs.append((i,pred))
        else:
            incorrect_imgs.append((i,pred))

    acc = num_correct / len(preds)
    siam_acc.append((acc, correct_imgs, incorrect_imgs))
    print acc



In [34]:

    
accs = []
for k in range(len(siam_acc)):
    acc, _, _ = siam_acc[k]
    accs.append(acc)
plt.plot(accs)
plt.title('Siamese Distance K-Nearest Neighbors Validation Accuracy')
plt.ylabel('Validation Accuracy')
plt.xlabel('Choice of K')
plt.show()
plt.savefig('siam_knn_val_acc.png')









    












    





<matplotlib.figure.Figure at 0x7f453e711e50>



In [35]:

    
acc, cor_ims, inc_ims = siam_acc[33]
confusion_matrix = np.zeros((10,10))
print len(cor_ims)
print len(inc_ims)
for ind, im in enumerate(cor_ims):
    i, pred = im
    inds, dists, classes, c_pred = pred
    confusion_matrix[c_pred, y_val[i]] += 1
    
for ind, im in enumerate(inc_ims):
    i, pred = im
    inds, dists, classes, c_pred = pred
    confusion_matrix[c_pred, y_val[i]] += 1
    
plt.matshow(confusion_matrix)
plt.colorbar()
plt.savefig('siam_knn_confusion_matrix.png')



In [36]:

    
display_top(10, siam_acc, accs)



In [ ]: