In [1]:
import tensorflow as tf

In [2]:
from tensorflow.examples.tutorials.mnist import input_data

In [None]:
mnist = input_data.read_data_sets("MNIST_data/", one_hot=True)

In [8]:
# Init weights
def init_weights(shape):
    init_random_dist = tf.truncated_normal(shape, stddev=.1)
    return tf.Variable(init_random_dist)

In [9]:
# Init bias
def init_bias(shape):
    init_bias_vals = tf.constant(.1, shape=shape)
    return tf.Variable(init_bias_vals)

In [18]:
# Tensor & Filter --> 2D Convolution
def conv2d(x, w):
    # x --> [batch, height, width, channels]
    # w --> [filterH, filterW, channelsIn, channelsOut]
    return tf.nn.conv2d(x, w, strides=[1, 1, 1, 1], padding='SAME')

In [19]:
# Pooling
def max_pool_2x2(x):
    # x --> [batch, height, width, channels]
    return tf.nn.max_pool(x, ksize=[1, 2, 2, 1], strides=[1, 2, 2, 1], padding='SAME')

In [12]:
# Convolutional Layer
def conv_layer(input_x, shape):
    w = init_weights(shape)
    b = init_bias([shape[3]])
    return tf.nn.relu(conv2d(input_x, w) + b)

In [13]:
# Fully Connected Layer
def dense_layer(input_layer, size):
    input_size = int(input_layer.get_shape()[1])
    w = init_weights([input_size, size])
    b = init_bias([size])
    return tf.matmul(input_layer, w) + b

In [15]:
# Placeholders
x = tf.placeholder(tf.float32, shape=[None, 784])
y_true = tf.placeholder(tf.float32, shape=[None, 10])

In [16]:
# Layers
x_img = tf.reshape(x, [-1, 28, 28, 1])

In [20]:
conv1 = conv_layer(x_img, shape=[5, 5, 1, 32])
conv1_pooling = max_pool_2x2(conv1)

In [21]:
conv2 = conv_layer(conv1_pooling, shape=[5, 5, 32, 64])
conv2_pooling = max_pool_2x2(conv2)

In [22]:
conv2_flat = tf.reshape(conv2_pooling, [-1, 7*7*64])
dense1 = tf.nn.relu(dense_layer(conv2_flat, 1024))

In [24]:
# Dropout
hold_prob = tf.placeholder(tf.float32)
dense_drop1 = tf.nn.dropout(dense1, keep_prob=hold_prob)

In [25]:
y_pred = dense_layer(dense_drop1, 10)

In [26]:
# Loss function
cross_entropy = tf.reduce_mean(
    tf.nn.softmax_cross_entropy_with_logits(labels=y_true, logits=y_pred))

Instructions for updating:

Future major versions of TensorFlow will allow gradients to flow
into the labels input on backprop by default.

See `tf.nn.softmax_cross_entropy_with_logits_v2`.



In [27]:
# Optimizer
optimizer = tf.train.AdamOptimizer(learning_rate=.001)
train = optimizer.minimize(cross_entropy)

In [28]:
init = tf.global_variables_initializer()

In [31]:
steps = 1000
with tf.Session() as s:
    s.run(init)
    
    for i in range(steps):
        batch_x, batch_y = mnist.train.next_batch(50)
        s.run(train, feed_dict={x: batch_x, y_true: batch_y, hold_prob:.5})
        
        if i % 100 == 0:
            print("On step: {}".format(i))
            print("Accuracy: ")
            matches = tf.equal(tf.argmax(y_pred, 1), tf.argmax(y_true, 1))
            acc = tf.reduce_mean(tf.cast(matches, tf.float32))
            print(s.run(
                acc, feed_dict={x:mnist.test.images, y_true: mnist.test.labels, hold_prob: 1}))

On step: 0
Accuracy: 
0.1873
On step: 100
Accuracy: 
0.9406
On step: 200
Accuracy: 
0.9582
On step: 300
Accuracy: 
0.9692
On step: 400
Accuracy: 
0.9741
On step: 500
Accuracy: 
0.9758
On step: 600
Accuracy: 
0.9828
On step: 700
Accuracy: 
0.9812
On step: 800
Accuracy: 
0.9815
On step: 900
Accuracy: 
0.9819
