## Multi-layer Perceptron

In [1]:
import tensorflow as tf
from tensorflow.examples.tutorials.mnist import input_data

### Load data

In [2]:
mnist = input_data.read_data_sets("MNIST_data/", one_hot=True)
trX, trY, teX, teY = mnist.train.images, mnist.train.labels, mnist.test.images, mnist.test.labels

Extracting MNIST_data/train-images-idx3-ubyte.gz
Extracting MNIST_data/train-labels-idx1-ubyte.gz
Extracting MNIST_data/t10k-images-idx3-ubyte.gz
Extracting MNIST_data/t10k-labels-idx1-ubyte.gz


### Helper functions

In [3]:
def init_weights(shape, name):
    """Build a named ``tf.Variable`` initialised with random-normal values.

    Args:
        shape: Shape of the variable; forwarded unchanged to ``tf.random_normal``.
        name: Name given to the variable in the graph.

    Returns:
        The ``tf.Variable`` wrapping the sampled initial values.
    """
    # A small standard deviation (0.01) keeps the initial weights tightly clustered.
    initial_values = tf.random_normal(shape, stddev=0.01)
    return tf.Variable(initial_values, name=name)

# This network is the same as the previous one, except that it has an extra hidden layer and applies dropout to the input and to each hidden layer's output
def model(X, w_h1, w_h2, w_o, p_keep_input, p_keep_hidden):
    """Assemble a two-hidden-layer perceptron with dropout before every matmul.

    Each stage is built inside its own ``tf.name_scope`` ("layer1", "layer2",
    "layer3") so the ops are grouped per layer in the graph visualization.

    Args:
        X: Input tensor multiplied by ``w_h1``.
        w_h1: Weights of the first hidden layer.
        w_h2: Weights of the second hidden layer.
        w_o: Weights of the output layer.
        p_keep_input: Keep probability passed to ``tf.nn.dropout`` for the input.
        p_keep_hidden: Keep probability passed to ``tf.nn.dropout`` for both
            hidden activations.

    Returns:
        The result of the final matmul; no activation or softmax is applied here.
    """
    with tf.name_scope("layer1"):
        dropped_input = tf.nn.dropout(X, p_keep_input)
        hidden1 = tf.nn.relu(tf.matmul(dropped_input, w_h1))

    with tf.name_scope("layer2"):
        dropped_hidden1 = tf.nn.dropout(hidden1, p_keep_hidden)
        hidden2 = tf.nn.relu(tf.matmul(dropped_hidden1, w_h2))

    with tf.name_scope("layer3"):
        dropped_hidden2 = tf.nn.dropout(hidden2, p_keep_hidden)
        output = tf.matmul(dropped_hidden2, w_o)

    return output

### Build graph

In [4]:
# Graph inputs: a batch of 784-feature rows, a batch of 10-way label rows,
# and the two dropout keep probabilities (fed at run time).
X = tf.placeholder("float", [None, 784], name="X")
Y = tf.placeholder("float", [None, 10], name="Y")
p_keep_input = tf.placeholder("float", name="p_keep_input")
p_keep_hidden = tf.placeholder("float", name="p_keep_hidden")

# Weight matrices: 784 -> 625 -> 625 -> 10
w_h1 = init_weights([784, 625], "w_h1")
w_h2 = init_weights([625, 625], "w_h2")
w_o = init_weights([625, 10], "w_o")

# Register one histogram summary per weight matrix, tagged with the variable's name
for _tag, _weights in (("w_h1", w_h1), ("w_h2", w_h2), ("w_o", w_o)):
    tf.histogram_summary(_tag, _weights)

# Network output fed to the loss and accuracy ops below
py_x = model(X, w_h1, w_h2, w_o, p_keep_input, p_keep_hidden)

with tf.name_scope("cost"):
    # Cross-entropy between the network output and the labels, averaged into a scalar
    per_example_loss = tf.nn.softmax_cross_entropy_with_logits(py_x, Y)
    cost = tf.reduce_mean(per_example_loss)
    optimizer = tf.train.RMSPropOptimizer(0.001, 0.9)
    train_op = optimizer.minimize(cost)
    # Scalar summary so the cost can be tracked in TensorBoard
    tf.scalar_summary("cost", cost)

with tf.name_scope("accuracy"):
    # A prediction is correct when the arg-max of the output matches the arg-max of the label row
    true_class = tf.argmax(Y, 1)
    predicted_class = tf.argmax(py_x, 1)
    correct_pred = tf.equal(true_class, predicted_class)
    # Cast booleans to floats so their mean is the fraction of correct predictions
    acc_op = tf.reduce_mean(tf.cast(correct_pred, "float"))
    # Scalar summary so the accuracy can be tracked in TensorBoard
    tf.scalar_summary("accuracy", acc_op)

### Launch graph

In [5]:
with tf.Session() as sess:
    # Create a log writer for TensorBoard. View the logs with
    # 'tensorboard --logdir=./logs/multi-layer-perceptron'
    writer = tf.train.SummaryWriter("./logs/multi-layer-perceptron", sess.graph)
    try:
        # Single op that evaluates every summary registered on the graph
        merged = tf.merge_all_summaries()

        # Variables must be initialized before any op that reads them is run
        tf.initialize_all_variables().run()

        for i in range(100):
            # zip() stops at the shorter range, so only full 128-example batches
            # are used; a trailing partial batch is skipped.
            for start, end in zip(range(0, len(trX), 128), range(128, len(trX)+1, 128)):
                sess.run(train_op, feed_dict={X: trX[start:end], Y: trY[start:end],
                                              p_keep_input: 0.8, p_keep_hidden: 0.5})
            # Evaluate on the test set with both keep probabilities set to 1.0
            summary, acc = sess.run([merged, acc_op], feed_dict={X: teX, Y: teY,
                                              p_keep_input: 1.0, p_keep_hidden: 1.0})
            writer.add_summary(summary, i)
            print(i, acc)
    finally:
        # Flush buffered events and release the event file, even if training
        # is interrupted or raises.
        writer.close()

(0, 0.9320001)
(1, 0.96030021)
(2, 0.96940011)
(3, 0.97550011)
(4, 0.97510016)
(5, 0.97370017)
(6, 0.97700012)
(7, 0.97720015)
(8, 0.97610021)
(9, 0.97840011)
(10, 0.97970009)
(11, 0.98090011)
(12, 0.98140013)
(13, 0.97980005)
(14, 0.98010015)
(15, 0.98100013)
(16, 0.98100019)
(17, 0.98240012)
(18, 0.98080009)
(19, 0.98100013)
(20, 0.98190016)
(21, 0.98220009)
(22, 0.98120022)
(23, 0.98110008)
(24, 0.98310018)
(25, 0.98160017)
(26, 0.9819001)
(27, 0.98260009)
(28, 0.98300016)
(29, 0.98300004)
(30, 0.98260009)
(31, 0.98270011)
(32, 0.98270017)
(33, 0.98290014)
(34, 0.98220015)
(35, 0.98240012)
(36, 0.9819001)
(37, 0.98300016)
(38, 0.98350012)
(39, 0.98250014)
(40, 0.98300016)
(41, 0.98300016)
(42, 0.98210019)
(43, 0.98260015)
(44, 0.98380011)
(45, 0.98360008)
(46, 0.98280013)
(47, 0.9830001)
(48, 0.98360014)
(49, 0.9823001)
(50, 0.98340011)
(51, 0.98240006)
(52, 0.98470008)
(53, 0.98260021)
(54, 0.98410004)
(55, 0.98380011)
(56, 0.9837001)
(57, 0.98430014)
(58, 0.98470014)
(59, 0.982800