notebook.community

Edit and run



In [1]:

    
import sys; print('Python \t\t{0[0]}.{0[1]}'.format(sys.version_info))
import tensorflow as tf; print('Tensorflow \t{}'.format(tf.__version__))
import keras; print('Keras \t\t{}'.format(keras.__version__))









    



Python 		3.6
Tensorflow 	1.0.0






    



Using TensorFlow backend.






    



Keras 		2.0.3



In [2]:

    
%matplotlib inline 

import numpy as np
import matplotlib.pyplot as plt



In [3]:

    
from tensorflow.examples.tutorials.mnist import input_data
mnist = input_data.read_data_sets("../mnist-data/", one_hot=True)









    



Extracting ../mnist-data/train-images-idx3-ubyte.gz
Extracting ../mnist-data/train-labels-idx1-ubyte.gz
Extracting ../mnist-data/t10k-images-idx3-ubyte.gz
Extracting ../mnist-data/t10k-labels-idx1-ubyte.gz



In [4]:

    
mnist.train.images.shape









    Out[4]:





(55000, 784)



In [5]:

    
plt.figure(figsize=(15,5))
for i in list(range(10)):
    plt.subplot(1, 10, i+1)
    pixels = mnist.test.images[i]
    pixels = pixels.reshape((28, 28))
    plt.imshow(pixels, cmap='gray_r')
plt.show()



In [6]:

    
import tensorflow as tf



In [7]:

    
# Set parameters
learning_rate = 0.01
training_iteration = 10
batch_size = 250
print_freq=1



In [8]:

    
# TF graph input
x = tf.placeholder('float', [None, 784]) # mnist data image of shape 28*28=784
y = tf.placeholder('float', [None, 10]) # 0-9 digits recognition => 10 classes

keep_rate = tf.placeholder(tf.float32)



In [9]:

    
def weight_variable(shape):
  initial = tf.constant(0.0, shape=shape)
  return tf.Variable(initial)

def bias_variable(shape):
  initial = tf.constant(0.1, shape=shape)
  return tf.Variable(initial)



In [10]:

    
with tf.name_scope("hidden_1") as scope:

    # Set model weights
    W_layer1 = weight_variable([784, 512])
    b_layer1 = bias_variable([512])

    # Construct a dense linear model, with act=relu and dropout
    layer_1 = tf.nn.dropout(tf.nn.relu(tf.matmul(x, W_layer1) + b_layer1), keep_rate) # Relu, dropout
        
    # Add summary ops to collect data
    tf.summary.histogram("W1_weights", W_layer1)
    tf.summary.histogram("B1_biases", b_layer1)



In [11]:

    
with tf.name_scope("hidden_2") as scope:

    # Set model weights
    W_layer2 = weight_variable([512, 512])
    b_layer2 = bias_variable([512])

    # Construct a dense linear model, with act=relu and dropout
    layer_2 = tf.nn.dropout(tf.nn.relu(tf.matmul(layer_1, W_layer2) + b_layer2), keep_rate) # Relu, dropout
    
    # Add summary ops to collect data
    tf.summary.histogram("W2_weights", W_layer2)
    tf.summary.histogram("B2_biases", b_layer2)



In [12]:

    
with tf.name_scope("output") as scope:

    # Set model weights
    W_layer3 = weight_variable([512, 10])
    b_layer3 = bias_variable([10])

    # Construct a dense linear model, with act=relu and dropout
    layer_3 = tf.add(tf.matmul(layer_2, W_layer3), b_layer3)
    
    # Add summary ops to collect data
    tf.summary.histogram("W3_weights", W_layer3)
    tf.summary.histogram("B3_biases", b_layer3)



In [13]:

    
#unscaled log probabilities
y_hat = layer_3

#model output
y_out = tf.nn.softmax(y_hat)

# More name scopes will clean up graph representation
with tf.name_scope("cost_function") as scope:
    # Minimize error using cross entropy
    # Cross entropy
    cost_function = tf.reduce_mean(tf.nn.softmax_cross_entropy_with_logits(labels=y,logits=y_hat))
    # Create a summary to monitor the cost function
    tf.summary.scalar("cost_function", cost_function)



In [14]:

    
with tf.name_scope("train") as scope:
    # Gradient descent
    optimizer = tf.train.AdamOptimizer().minimize(cost_function)



In [15]:

    
# Initializing the variables
init = tf.global_variables_initializer()

# Merge all summaries into a single operator
merged_summary_op = tf.summary.merge_all()



In [16]:

    
# Launch the graph
sess = tf.InteractiveSession()
sess.run(init)



In [17]:

    
# Change this to a location on your computer
summary_writer = tf.summary.FileWriter('./tensorboard/tf', graph=sess.graph)



In [18]:

    
# Training cycle
for iteration in range(training_iteration):
    avg_cost = 0.
    total_batch = int(mnist.train.num_examples/batch_size)
    # Loop over all batches
    for i in range(total_batch):
        batch_xs, batch_ys = mnist.train.next_batch(batch_size)
        
        # dropout placeholder
        batch_kr = 0.75
        
        # Fit training using batch data
        sess.run(optimizer, feed_dict={x: batch_xs, keep_rate: batch_kr, y: batch_ys})
        
        # Compute the average loss
        avg_cost += sess.run(cost_function, feed_dict={x: batch_xs, keep_rate: batch_kr, y: batch_ys})/(total_batch+1)

        # Write logs for each iteration
        summary_str = sess.run(merged_summary_op, feed_dict={x: batch_xs, keep_rate:batch_kr, y: batch_ys})
        summary_writer.add_summary(summary_str, iteration*total_batch + i)
        
    # Display logs per iteration step
    if iteration % print_freq ==0 :
        print("Iteration:", '%04d' % (iteration), "cost=", "{:.9f}".format(avg_cost))









    



Iteration: 0000 cost= 0.683263521
Iteration: 0001 cost= 0.189000007
Iteration: 0002 cost= 0.123381180
Iteration: 0003 cost= 0.088558772
Iteration: 0004 cost= 0.071210058
Iteration: 0005 cost= 0.056130819
Iteration: 0006 cost= 0.045940143
Iteration: 0007 cost= 0.038140648
Iteration: 0008 cost= 0.032672639
Iteration: 0009 cost= 0.028221791



In [19]:

    
# Test the model
predictions = tf.equal(tf.argmax(y_out, 1), tf.argmax(y, 1))

# Calculate accuracy
accuracy = tf.reduce_mean(tf.cast(predictions, "float"))
print("Accuracy:", accuracy.eval({x: mnist.test.images, keep_rate:1.0, y: mnist.test.labels}))









    



Accuracy: 0.9795



In [20]:

    
# test item #100 is a six
pixels = mnist.test.images[100]

#predict
result = sess.run(y_out, feed_dict={x:[pixels], keep_rate:1.0})
dict(zip(range(10), result[0]))









    Out[20]:





{0: 6.0899251e-06,
 1: 6.2345753e-06,
 2: 4.9691484e-06,
 3: 3.3737287e-08,
 4: 3.3895682e-07,
 5: 4.0409548e-05,
 6: 0.99992764,
 7: 2.2955151e-08,
 8: 1.4148809e-05,
 9: 1.5094564e-10}



In [21]:

    
def test_render(pixels, result, truth):
    #pixels, result and truth are np vectors
    plt.figure(figsize=(10,5))
    plt.subplot(1, 2, 1)
    pixels = pixels.reshape((28, 28))
    plt.imshow(pixels, cmap='gray_r')

    plt.subplot(1, 2, 2)
    
    #index, witdh
    ind = np.arange(len(result))
    width = 0.4

    plt.barh(ind,result, width, color='orange', edgecolor='k', hatch="/")
    plt.barh(ind+width,truth,width, color='g', edgecolor='k')
    plt.yticks(ind+width, range(10))
    plt.margins(y=0)

    plt.show()



In [23]:

    
import random
i = random.randint(0,mnist.test.images.shape[0])

pixels = mnist.test.images[i]
truth  = mnist.test.labels[i]
result = sess.run(y_out, feed_dict={x:[pixels], keep_rate:1.0})[0]

test_render(pixels, result, truth)



In [24]:

    
### What went wrong?
pixels = mnist.test.images
truth = mnist.test.labels

feed_dict = {x:pixels}
feed_dict.update({keep_rate:1.0})

result = sess.run(y_out, feed_dict=feed_dict)



In [25]:

    
acc = result.argmax(axis=1) == truth.argmax(axis=1)
incorrect = np.argwhere(acc==False).flatten()

print("Incorrect predictions: {}".format(len(incorrect)))









    



Incorrect predictions: 205



In [26]:

    
plt.figure(figsize=(20,5))
plt_idx = 1
for i in list(incorrect[:16]):
    plt.subplot(1, 16, plt_idx)
    pixels = mnist.test.images[i]
    pixels = pixels.reshape((28, 28))
    plt.imshow(pixels, cmap='gray_r')
    plt_idx += 1
plt.show()



In [27]:

    
i = random.choice(list(incorrect))

pixels = mnist.test.images[i]
truth  = mnist.test.labels[i]

feed_dict = {x:[pixels]}
feed_dict.update({keep_rate:1.0})
result = sess.run(y_out, feed_dict=feed_dict)[0]

test_render(pixels, result, truth)



In [ ]:

    
# Close the Session when we're done.
# sess.close()



In [ ]: