In [2]:
import tensorflow as tf
from tensorflow.examples.tutorials.mnist import input_data
import numpy as np

# Fix TensorFlow's graph-level seed so variable initialisation and dropout
# masks are drawn from a repeatable sequence.
RANDOM_SEED = 777
tf.set_random_seed(RANDOM_SEED)

# Read the MNIST splits from MNIST_DIR with labels expanded to one-hot
# vectors, which is the label layout the model's softmax loss is fed with.
MNIST_DIR = "MNIST_data/"
mnist = input_data.read_data_sets(MNIST_DIR, one_hot=True)

Extracting MNIST_data/train-images-idx3-ubyte.gz
Extracting MNIST_data/train-labels-idx1-ubyte.gz
Extracting MNIST_data/t10k-images-idx3-ubyte.gz
Extracting MNIST_data/t10k-labels-idx1-ubyte.gz


In [3]:
class Model:
    """Convolutional classifier for flattened 28x28 single-channel images.

    The graph is three conv/max-pool/dropout stages, a 625-unit ReLU dense
    layer with dropout, and a 10-unit linear output layer. All layers are
    created under ``tf.variable_scope(name)``.

    Args:
        sess: Session used by ``predict``, ``get_accuracy`` and ``train`` to
            run the graph.
        name: Variable scope name under which the layers are created.
        learning_rate: Step size passed to ``tf.train.AdamOptimizer``. When
            left as ``None`` the notebook-level ``learning_rate`` variable is
            read while the graph is built, so existing two-argument callers
            behave as before.

    Attributes set while building the graph:
        training: bool placeholder that switches the dropout layers on/off.
        X: float32 placeholder of shape [None, 784].
        Y: float32 placeholder of shape [None, 10] (one label row per image).
        logits: output of the final dense layer (no activation).
        cost: mean softmax cross-entropy between ``logits`` and ``Y``.
        optimizer: op that applies one Adam update minimising ``cost``.
        accuracy: fraction of rows where argmax(logits) equals argmax(Y).
    """

    def __init__(self, sess, name, learning_rate=None):
        self.sess = sess
        self.name = name
        self.learning_rate = learning_rate
        self._build_net()

    def _build_net(self):
        """Create placeholders, layers, loss, optimizer and accuracy ops."""
        with tf.variable_scope(self.name):
            # Boolean switch for the dropout layers: feed True while training
            # (units are dropped) and False for evaluation (dropout is a no-op).
            self.training = tf.placeholder(tf.bool)

            # Input placeholder: one flattened 28*28 image per row.
            self.X = tf.placeholder(tf.float32, shape=[None, 28*28])

            # Restore the spatial layout: (?, 28, 28, 1).
            X_img = tf.reshape(self.X, [-1, 28, 28, 1])
            self.Y = tf.placeholder(tf.float32, shape=[None, 10])

            # Stage 1: (?, 28, 28, 1) -> conv (?, 28, 28, 32) -> pool (?, 14, 14, 32)
            conv1 = tf.layers.conv2d(inputs=X_img, filters=32, kernel_size=[3, 3],
                                     padding="SAME", activation=tf.nn.relu)
            pool1 = tf.layers.max_pooling2d(inputs=conv1, pool_size=[2, 2],
                                            padding="SAME", strides=2)
            dropout1 = tf.layers.dropout(inputs=pool1, rate=0.3, training=self.training)

            # Stage 2: (?, 14, 14, 32) -> conv (?, 14, 14, 64) -> pool (?, 7, 7, 64)
            conv2 = tf.layers.conv2d(inputs=dropout1, filters=64, kernel_size=[3, 3],
                                     padding="SAME", activation=tf.nn.relu)
            pool2 = tf.layers.max_pooling2d(inputs=conv2, pool_size=[2, 2],
                                            padding="SAME", strides=2)
            dropout2 = tf.layers.dropout(inputs=pool2, rate=0.3, training=self.training)

            # Stage 3: (?, 7, 7, 64) -> conv (?, 7, 7, 128) -> pool (?, 4, 4, 128)
            # (SAME padding rounds 7 / 2 up to 4).
            conv3 = tf.layers.conv2d(inputs=dropout2, filters=128, kernel_size=[3, 3],
                                     padding="SAME", activation=tf.nn.relu)
            pool3 = tf.layers.max_pooling2d(inputs=conv3, pool_size=[2, 2],
                                            padding="SAME", strides=2)
            dropout3 = tf.layers.dropout(inputs=pool3, rate=0.3, training=self.training)

            # Dense layer with ReLU on the flattened (?, 4 * 4 * 128) features.
            flat = tf.reshape(dropout3, [-1, 4 * 4 * 128])
            dense4 = tf.layers.dense(inputs=flat, units=625, activation=tf.nn.relu)
            dropout4 = tf.layers.dropout(inputs=dense4, rate=0.5, training=self.training)

            # Logits (no activation): final FC layer, 625 inputs -> 10 outputs.
            # Built inside the variable scope so the output layer's variables
            # are namespaced under this model like every other layer.
            self.logits = tf.layers.dense(inputs=dropout4, units=10)

        # Resolve the optimizer step size. Falling back to the notebook-level
        # `learning_rate` keeps callers that do not pass the argument working.
        if self.learning_rate is None:
            step_size = learning_rate
        else:
            step_size = self.learning_rate

        # Loss and optimizer.
        self.cost = tf.reduce_mean(
            tf.nn.softmax_cross_entropy_with_logits_v2(logits=self.logits, labels=self.Y))
        self.optimizer = tf.train.AdamOptimizer(learning_rate=step_size).minimize(self.cost)

        # Accuracy: share of rows whose highest logit matches the label's argmax.
        correct_prediction = tf.equal(tf.argmax(self.logits, 1), tf.argmax(self.Y, 1))
        self.accuracy = tf.reduce_mean(tf.cast(correct_prediction, dtype=tf.float32))

    def predict(self, x_test, training=False):
        """Run the network on ``x_test`` and return the raw logits.

        The result is the un-normalised output of the last dense layer, not
        class indices or probabilities. ``training`` is fed to the dropout
        switch and defaults to False (dropout disabled).
        """
        feed = {self.X: x_test, self.training: training}
        return self.sess.run(self.logits, feed_dict=feed)

    def get_accuracy(self, x_test, y_test, training=False):
        """Return the value of the ``accuracy`` op for ``x_test``/``y_test``.

        ``training`` is fed to the dropout switch and defaults to False.
        """
        feed = {self.X: x_test, self.Y: y_test, self.training: training}
        return self.sess.run(self.accuracy, feed_dict=feed)

    def train(self, x_train, y_train, training=True):
        """Run one optimizer step on a batch.

        Returns the session result for ``[cost, optimizer]``: the batch cost
        first, then whatever running the optimizer op yields. ``training`` is
        fed to the dropout switch and defaults to True (dropout enabled).
        """
        feed = {self.X: x_train, self.Y: y_train, self.training: training}
        return self.sess.run([self.cost, self.optimizer], feed_dict=feed)

In [4]:
# Hyperparameters for this run
batch_size = 100
num_epochs = 15
learning_rate = 0.001
# Number of whole mini-batches in one pass over the training split
num_iterations = mnist.train.num_examples // batch_size


def _mean_epoch_cost(model, dataset, steps, size):
    """Train `model` for `steps` mini-batches and return the averaged cost.

    Each step draws `size` examples from `dataset`, runs one training step,
    and adds that step's cost divided by `steps` to a running total.
    """
    running = 0
    for step in range(steps):
        images, labels = dataset.next_batch(size)
        step_cost, _opt_result = model.train(images, labels)
        running += step_cost / steps
    return running


# Build the graph in a fresh session, then initialise every variable
sess = tf.Session()
m1 = Model(sess, 'm1')
sess.run(tf.global_variables_initializer())

print("Learning Started!")

# One line of progress per epoch: 1-based epoch number and mean batch cost
for epoch_idx in range(num_epochs):
    avg_cost = _mean_epoch_cost(m1, mnist.train, num_iterations, batch_size)
    print("Epoch:", "%04d" % (epoch_idx + 1), "Cost:", "%.9f" % (avg_cost))

print('Learning Finished!')

Instructions for updating:
Use keras.layers.conv2d instead.
Instructions for updating:
Colocations handled automatically by placer.
Instructions for updating:
Use keras.layers.max_pooling2d instead.
Instructions for updating:
Use keras.layers.dropout instead.
Instructions for updating:
Please use `rate` instead of `keep_prob`. Rate should be set to `rate = 1 - keep_prob`.
Instructions for updating:
Use keras.layers.dense instead.
Learning Started!
Epoch: 0001 Cost: 0.292316119
Epoch: 0002 Cost: 0.092085041
Epoch: 0003 Cost: 0.067789306
Epoch: 0004 Cost: 0.056765077
Epoch: 0005 Cost: 0.049974664
Epoch: 0006 Cost: 0.046826896
Epoch: 0007 Cost: 0.040395696
Epoch: 0008 Cost: 0.040456974
Epoch: 0009 Cost: 0.035972636
Epoch: 0010 Cost: 0.033343539
Epoch: 0011 Cost: 0.031386594
Epoch: 0012 Cost: 0.031871886
Epoch: 0013 Cost: 0.027765510
Epoch: 0014 Cost: 0.028236290
Epoch: 0015 Cost: 0.028185746
Learning Finished!


In [5]:
# Score the trained model on the held-out test split. get_accuracy leaves the
# dropout switch at its default of False, so dropout is disabled here.
test_accuracy = m1.get_accuracy(mnist.test.images, mnist.test.labels)
print("Accuracy", test_accuracy)

Accuracy 0.9943
