In [2]:
'''
A Multilayer Perceptron implementation example using TensorFlow library.
This example is using the MNIST database of handwritten digits
(http://yann.lecun.com/exdb/mnist/)

Author: Aymeric Damien
Project: https://github.com/aymericdamien/TensorFlow-Examples/
'''

'\nA Multilayer Perceptron implementation example using TensorFlow library.\nThis example is using the MNIST database of handwritten digits\n(http://yann.lecun.com/exdb/mnist/)\n\nAuthor: Aymeric Damien\nProject: https://github.com/aymericdamien/TensorFlow-Examples/\n'

In [3]:
# Import MINST data
from tensorflow.examples.tutorials.mnist import input_data
mnist = input_data.read_data_sets("MNIST_data/", one_hot=True)

import tensorflow as tf


# Parameters
batch_size = 100
num_steps = 4000
data_showing_step = 100

# Network Parameters
n_hidden_1 = 256 # 1st layer number of features
n_hidden_2 = 256 # 2nd layer number of features
n_input = 784 # MNIST data input (img shape: 28*28)
n_classes = 10 # MNIST total classes (0-9 digits)

# tf Graph input
x = tf.placeholder("float", [None, n_input])
y = tf.placeholder("float", [None, n_classes])
learning_rate_decayed = tf.placeholder(tf.float32, shape=[])

Extracting MNIST_data/train-images-idx3-ubyte.gz
Extracting MNIST_data/train-labels-idx1-ubyte.gz
Extracting MNIST_data/t10k-images-idx3-ubyte.gz
Extracting MNIST_data/t10k-labels-idx1-ubyte.gz


In [4]:
# Create model
def multilayer_perceptron(x, weights, biases):
    # Hidden layer with RELU activation
    layer_1 = tf.add(tf.matmul(x, weights['h1']), biases['b1'])
    layer_1 = tf.nn.relu(layer_1)
    # Hidden layer with RELU activation
    layer_2 = tf.add(tf.matmul(layer_1, weights['h2']), biases['b2'])
    layer_2 = tf.nn.relu(layer_2)
    # Output layer with linear activation
    out_layer = tf.matmul(layer_2, weights['out']) + biases['out']
    return out_layer


# Store layers weight & bias
weights = {
    'h1': tf.Variable(tf.random_normal([n_input, n_hidden_1])),
    'h2': tf.Variable(tf.random_normal([n_hidden_1, n_hidden_2])),
    'out': tf.Variable(tf.random_normal([n_hidden_2, n_classes]))
}
biases = {
    'b1': tf.Variable(tf.random_normal([n_hidden_1])),
    'b2': tf.Variable(tf.random_normal([n_hidden_2])),
    'out': tf.Variable(tf.random_normal([n_classes]))
}

# Construct model
pred = multilayer_perceptron(x, weights, biases)

# Define loss and optimizer
cost = tf.reduce_mean(tf.nn.softmax_cross_entropy_with_logits(logits=pred, labels=y))
optimizer = tf.train.AdamOptimizer(learning_rate=learning_rate_decayed).minimize(cost)

# Initializing the variables
init = tf.global_variables_initializer()

In [5]:
# Launch the graph
sess = tf.InteractiveSession()
sess.run(init)

# Training cycle
for step in range(num_steps):
    
    avg_cost = 0.
    total_batch = int(mnist.train.num_examples/batch_size)
    
    if 30000 < step < 80000:
        learning_rate = 0.01 / 10
    elif 80000 <= step < 200000:
        learning_rate = 0.01 / 100
    else:
        learning_rate = 0.01

    # set a offset
    offset = (step * batch_size) % (mnist.train.labels.shape[0] - batch_size)

    # Generate a minibatch.
    batch_data = mnist.train.images[offset:(offset + batch_size), :]
    batch_labels = mnist.train.labels[offset:(offset + batch_size), :]
    
    feed_dict = {x: batch_data, 
                 y: batch_labels,
                 learning_rate_decayed: learning_rate}
    
    _, c = sess.run([optimizer, cost], feed_dict=feed_dict)
    
    # Compute average loss
    avg_cost += c / total_batch
    
    if (step % data_showing_step == 0):
        print "step:", '%04d' % (step+batch_size), "cost=", "{:.9f}".format(avg_cost)

print "Optimization Finished!"

step: 0100 cost= 3.612372159
step: 0200 cost= 0.046545570
step: 0300 cost= 0.036489483
step: 0400 cost= 0.027970713
step: 0500 cost= 0.018557151
step: 0600 cost= 0.009317975
step: 0700 cost= 0.018626598
step: 0800 cost= 0.012463570
step: 0900 cost= 0.007882543
step: 1000 cost= 0.006299686
step: 1100 cost= 0.008945249
step: 1200 cost= 0.007009433
step: 1300 cost= 0.008139231
step: 1400 cost= 0.008677087
step: 1500 cost= 0.001134169
step: 1600 cost= 0.008046789
step: 1700 cost= 0.010661273
step: 1800 cost= 0.000055152
step: 1900 cost= 0.005470282
step: 2000 cost= 0.000717611
step: 2100 cost= 0.014976241
step: 2200 cost= 0.010334287
step: 2300 cost= 0.001379655
step: 2400 cost= 0.001192659
step: 2500 cost= 0.010680760
step: 2600 cost= 0.010929030
step: 2700 cost= 0.005955373
step: 2800 cost= 0.002402276
step: 2900 cost= 0.001472202
step: 3000 cost= 0.000511149
step: 3100 cost= 0.000419174
step: 3200 cost= 0.001526392
step: 3300 cost= 0.013002790
step: 3400 cost= 0.000887756
step: 3500 cos

In [6]:
# Test model
correct_prediction = tf.equal(tf.argmax(pred, 1), tf.argmax(y, 1))
# Calculate accuracy
accuracy = tf.reduce_mean(tf.cast(correct_prediction, "float"))
print "Accuracy:", accuracy.eval({x: mnist.test.images, y: mnist.test.labels})

#sess.close()

Accuracy: 0.9516


In [7]:
predict = sess.run(pred, feed_dict={x: mnist.test.images})

In [8]:
predict[0]

array([-102.1829834 ,  -65.20870972,   26.33320808,   78.12233734,
       -115.69210052,  -25.75245667, -353.78411865,  522.88085938,
        -70.0782547 ,   89.16830444], dtype=float32)

In [9]:
mnist.test.labels[0]

array([ 0.,  0.,  0.,  0.,  0.,  0.,  0.,  1.,  0.,  0.])