# MNIST CNN

In [22]:
import tensorflow as tf

In [23]:
from tensorflow.examples.tutorials.mnist import input_data

In [24]:
# Read the MNIST archives from the local MNIST_data/ directory; labels are
# requested in one-hot form.
mnist = input_data.read_data_sets(
    'MNIST_data/',
    one_hot=True,
)

Extracting MNIST_data/train-images-idx3-ubyte.gz
Extracting MNIST_data/train-labels-idx1-ubyte.gz
Extracting MNIST_data/t10k-images-idx3-ubyte.gz
Extracting MNIST_data/t10k-labels-idx1-ubyte.gz


# Helper
## Initialize Weights

In [25]:
def init_weights(shape, layers):
    """Create a trainable weight variable drawn from a truncated normal.

    Args:
        shape: Shape of the weight tensor to create.
        layers: Number used to scale the initial spread. The callers in this
            notebook pass the layer's output size (``shape[3]`` or ``size``).

    Returns:
        A ``tf.Variable`` initialised from a truncated normal distribution
        with standard deviation ``1 / (layers + 512)``.
    """
    # The float literal forces true division. Under Python 2 the expression
    # ``1/(layers + 512)`` is integer division and evaluates to 0, which would
    # start every weight at exactly zero.
    stddev = 1.0 / (layers + 512)
    init_rand_dist = tf.truncated_normal(shape=shape, stddev=stddev)
    return tf.Variable(init_rand_dist)

# Initialize Bias

In [26]:
def init_bias(shape):
    """Return a bias variable of the given shape with every entry set to 0.1."""
    return tf.Variable(tf.constant(0.1, shape=shape))

# Conv2d

In [27]:
def conv2d(x, w):
    """Convolve ``x`` with the filter ``w`` using stride 1 and 'SAME' padding."""
    unit_strides = [1, 1, 1, 1]
    return tf.nn.conv2d(x, w, strides=unit_strides, padding='SAME')

## Pooling

In [28]:
def max_pool_2by2(x):
    """Max-pool ``x`` with a 2x2 window and stride 2, using 'SAME' padding."""
    window = [1, 2, 2, 1]
    step = [1, 2, 2, 1]
    return tf.nn.max_pool(x, ksize=window, strides=step, padding='SAME')

# Layers

In [29]:
def convolve_layer(input_x, shape):
    """Build one convolution layer with a ReLU activation.

    Args:
        input_x: Tensor fed into the convolution.
        shape: Four-element filter shape; ``shape[3]`` is used as the bias
            length and as the scaling argument for the weight initialiser.

    Returns:
        ``relu(conv2d(input_x, w) + b)`` with freshly created ``w`` and ``b``.
    """
    out_channels = shape[3]
    kernel = init_weights(shape=shape, layers=out_channels)
    bias = init_bias([out_channels])
    pre_activation = conv2d(input_x, kernel) + bias
    return tf.nn.relu(pre_activation)

# Fully connected

In [43]:
def fully_connected(input_layer, size):
    """Build a dense layer with no activation.

    Args:
        input_layer: Tensor whose second dimension gives the number of inputs.
        size: Number of output units.

    Returns:
        ``matmul(input_layer, w) + b`` with freshly created ``w`` and ``b``.
    """
    n_inputs = int(input_layer.get_shape()[1])
    weights = init_weights([n_inputs, size], layers=size)
    bias = init_bias([size])
    projected = tf.matmul(input_layer, weights)
    return projected + bias

# Placeholders

In [44]:
# Input placeholder: any number of rows, 784 float values per row.
x = tf.placeholder(dtype=tf.float32, shape=[None, 784])

In [45]:
# Label placeholder: any number of rows, 10 float values per row.
y_true = tf.placeholder(dtype=tf.float32, shape=[None, 10])

In [46]:
# View each 784-value row as a 28x28 image with a single channel; -1 lets the
# batch dimension be inferred.
x_image = tf.reshape(x, shape=[-1, 28, 28, 1])

In [47]:
# First convolution block: 3x3 filters, 1 input channel, 32 output channels,
# followed by 2x2 max pooling.
conv1 = convolve_layer(x_image, [3, 3, 1, 32])
pool1_conv = max_pool_2by2(conv1)

In [48]:
# Second convolution block: 4x4 filters, 32 input channels, 64 output
# channels, followed by 2x2 max pooling.
conv2 = convolve_layer(pool1_conv, [4, 4, 32, 64])
pool2_conv = max_pool_2by2(conv2)

In [49]:
# Flatten the pooled feature maps to one row of 7*7*64 values per example,
# then apply a 512-unit dense layer with ReLU.
conv2flat = tf.reshape(pool2_conv, shape=[-1, 7 * 7 * 64])
full_layer_1 = tf.nn.relu(
    fully_connected(conv2flat, 512)
)

In [50]:
# Dropout on the dense layer; the keep probability is fed at run time.
hold_prob = tf.placeholder(dtype=tf.float32)
full_one_drop = tf.nn.dropout(
    full_layer_1,
    keep_prob=hold_prob,
)

In [51]:
# Output layer: 10 raw scores per example (no activation applied here).
y_pred = fully_connected(input_layer=full_one_drop, size=10)

## Loss function

In [52]:
# Mean softmax cross-entropy between the labels and the raw network outputs.
cross_en = tf.reduce_mean(
    tf.nn.softmax_cross_entropy_with_logits(
        labels=y_true,
        logits=y_pred,
    )
)

## Optimizer

In [53]:
# Adam optimiser with learning rate 0.01; `train` is the op that applies one
# update step minimising the cross-entropy loss.
opt = tf.train.AdamOptimizer(
    learning_rate=0.01,
)
train = opt.minimize(loss=cross_en)

In [54]:
# Op that initialises every variable created so far in the graph.
init = tf.global_variables_initializer()

In [55]:
steps = 5000

# Build the evaluation ops once, before the session starts. Creating them
# inside the training loop adds a fresh set of nodes to the graph at every
# report, so the graph keeps growing for the whole run.
matches = tf.equal(tf.argmax(y_pred, 1), tf.argmax(y_true, 1))
acc = tf.reduce_mean(tf.cast(matches, tf.float32))

with tf.Session() as sess:

    sess.run(init)

    for i in range(steps):
        batch_x, batch_y = mnist.train.next_batch(50)

        # One optimisation step on a batch of 50, with a dropout keep
        # probability of 0.4.
        sess.run(train, feed_dict={x: batch_x, y_true: batch_y, hold_prob: 0.4})

        # Report test-set accuracy every 100 steps.
        if i % 100 == 0:

            print("ON STEP: {}".format(i))
            print('ACCURACY')

            # Dropout is disabled (keep probability 1.0) for evaluation.
            print(sess.run(acc, feed_dict={x: mnist.test.images,
                                           y_true: mnist.test.labels,
                                           hold_prob: 1.0}))
            print("\n")

ON STEP: 0
ACCURACY
0.0982


ON STEP: 100
ACCURACY
0.9147


ON STEP: 200
ACCURACY
0.9466


ON STEP: 300
ACCURACY
0.9598


ON STEP: 400
ACCURACY
0.9658


ON STEP: 500
ACCURACY
0.9689


ON STEP: 600
ACCURACY
0.9718


ON STEP: 700
ACCURACY
0.9617


ON STEP: 800
ACCURACY
0.9736


ON STEP: 900
ACCURACY
0.9601


ON STEP: 1000
ACCURACY
0.9618


ON STEP: 1100
ACCURACY
0.9751


ON STEP: 1200
ACCURACY
0.9717


ON STEP: 1300
ACCURACY
0.977


ON STEP: 1400
ACCURACY
0.9733


ON STEP: 1500
ACCURACY
0.9771


ON STEP: 1600
ACCURACY
0.9774


ON STEP: 1700
ACCURACY
0.9765


ON STEP: 1800
ACCURACY
0.973


ON STEP: 1900
ACCURACY
0.9768


ON STEP: 2000
ACCURACY
0.9812


ON STEP: 2100
ACCURACY
0.9755


ON STEP: 2200
ACCURACY
0.9806


ON STEP: 2300
ACCURACY
0.9772


ON STEP: 2400
ACCURACY
0.9758


ON STEP: 2500
ACCURACY
0.9778


ON STEP: 2600
ACCURACY
0.9781


ON STEP: 2700
ACCURACY
0.9723


ON STEP: 2800
ACCURACY
0.9764


ON STEP: 2900
ACCURACY
0.9778


ON STEP: 3000
ACCURACY
0.9764


ON STEP: 3100
ACCURACY