Single-layer Perceptron For MNIST Dataset

Load the dataset

In [1]:
# TensorFlow builds and runs the model graph; NumPy is used for reshaping
# arrays when plotting.
import tensorflow as tf
import numpy as np

# MNIST loader from the TensorFlow tutorials package.
from tensorflow.examples.tutorials.mnist import input_data
# Read the MNIST archives stored under /tmp/data. `one_hot=True` asks for the
# labels as one-hot vectors, matching the [None, num_classes] label
# placeholder defined later in the notebook.
mnist_data = input_data.read_data_sets('/tmp/data', one_hot=True)

Extracting /tmp/data/train-images-idx3-ubyte.gz
Extracting /tmp/data/train-labels-idx1-ubyte.gz
Extracting /tmp/data/t10k-images-idx3-ubyte.gz
Extracting /tmp/data/t10k-labels-idx1-ubyte.gz

Visualize a sample subset of data

In [2]:
import matplotlib.pyplot as plt
%matplotlib inline

import numpy as np

f,a = plt.subplots(5,10,figsize=(10,5))
for i in range(5):
    for j in range(10):
        index = (i-1)*5 + j
        a[i][j].imshow(np.reshape(mnist_data.test.images[index],(28,28)), cmap='Greys_r')

Side Note: What are Tensors?

  • A vector is one-dimensional
  • A matrix is 2-dimensional
  • A tensor can have $k$ dimensions $$\left[\begin{array}{cccc} & & & \\ & & & \\ & & & \end{array}\right]_{n_1 \times n_2 \times \cdots \times n_k}$$

    Read about tensors: Animashree Anandkumar

Set Network and Learning Parameters

In [7]:
## set learning parameters
learning_rate = 0.5
batch_size = 128
trainig_iters = 2000   ## number of training steps (name kept: used by the training cell)
dispay_step = 20       ## logging interval (name kept for compatibility)

# set network parameters
num_weights = 32
num_dims = 784    ## number of input pixels (28 x 28)
num_classes = 10  ## digits 0-9
num_layers = 1    ## number of hidden layers

# create placeholders for data
x = tf.placeholder(tf.float32, [None, num_dims])
y_ = tf.placeholder(tf.float32, [None, num_classes])
#### 2-D tensors of floating-point numbers, e.g. x has shape [None, 784].
####  --> None means that a dimension can be of any length
####  --> placeholder x stores a batch of data samples
####  --> placeholder y_ holds the true (one-hot encoded) labels

## define weights: initialize from a truncated normal distribution
weights = tf.Variable(tf.truncated_normal([num_dims, num_classes],
                                          mean=0, stddev=1.0/num_dims))
biases = tf.Variable(tf.zeros(shape=[num_classes]))
# --> initial weights are normally distributed, with sigma=(1/n)

## define the model (network)
## Keep the un-normalized scores (logits) separate from the softmax output:
## the loss below needs the logits, while `y` holds the class probabilities
## used for prediction.
logits = tf.matmul(x, weights) + biases
y = tf.nn.softmax(logits)

## define the loss-function: Cross-Entropy Loss Function
### One way to define the loss is as follows
###  (but it is numerically unstable and should be avoided)
# cross_entropy = tf.reduce_mean(-tf.reduce_sum(y_ * tf.log(y), reduction_indices=[1]))
#### --> tf.reduce_sum adds the elements in the dimension specified by reduction_indices
#### --> tf.reduce_mean computes the mean over all the examples in the batch

## Instead, we use tf.nn.softmax_cross_entropy_with_logits.
## It applies softmax internally, so it must receive the raw logits; passing
## the already-normalized `y` would apply softmax twice and distort the loss.
## Keyword arguments are used so the call does not depend on the positional
## order of (labels, logits).
cross_entropy = tf.reduce_mean(
    tf.nn.softmax_cross_entropy_with_logits(labels=y_, logits=logits))

## Training: one gradient-descent step on the mean cross-entropy
train_step = tf.train.GradientDescentOptimizer(learning_rate).minimize(cross_entropy)

Tensorflow Session

In [8]:
## define initialization of variables
init = tf.initialize_all_variables()

## start a Tensorflow session and intitalize variables
sess = tf.Session()

losses = []
for i in range(trainig_iters):
    batch_xs, batch_ys = mnist_data.train.next_batch(batch_size), feed_dict={x: batch_xs, y_: batch_ys})
    _, loss_val =[train_step, cross_entropy], 
                           feed_dict={x: batch_xs, y_: batch_ys})

fig = plt.figure(figsize=(10,5))
plt.plot(np.arange(len(losses)), losses)

Evaluating the model

In [9]:
# A prediction is correct when the most probable class in `y` matches the
# position of the 1 in the one-hot label `y_`.
correct_prediction = tf.equal(tf.argmax(y,1), tf.argmax(y_,1))

# Cast the booleans to 0.0/1.0 so their mean is the fraction of correct predictions.
accuracy = tf.reduce_mean(tf.cast(correct_prediction, tf.float32))

# Evaluate the accuracy op on the full test set using the trained session.
print(sess.run(accuracy, feed_dict={x: mnist_data.test.images, y_: mnist_data.test.labels}))


In [6]:
# Display the learned weight vector of each of the 10 classes as a 28x28 image.
with sess.as_default():
    # Fetch the current weight matrix (one column per class) as a NumPy array.
    W = weights.eval()
    fig,ax = plt.subplots(2,5,figsize=(20,8))
    for i in range(10):
        # Integer division picks the row; `i/5` is a float under Python 3 and
        # cannot be used as an array index.
        ax[i//5][i%5].imshow(np.reshape(W[:,i], (28,28)), cmap='Greys_r')

In [ ]: