In [60]:
import tensorflow as tf
import numpy as np

# Download MNIST data
from tensorflow.examples.tutorials.mnist import input_data
mnist = input_data.read_data_sets("data/multilayer-perceptron/", one_hot=True)

# The features are already scaled and the data is shuffled
train_features = mnist.train.images
test_features = mnist.test.images

Extracting data/multilayer-perceptron/train-images-idx3-ubyte.gz
Extracting data/multilayer-perceptron/train-labels-idx1-ubyte.gz
Extracting data/multilayer-perceptron/t10k-images-idx3-ubyte.gz
Extracting data/multilayer-perceptron/t10k-labels-idx1-ubyte.gz


In [67]:
# Parameters
learning_rate = 0.001
training_epochs = 20
batch_size = 128 # decrease your batch size if you don't have enough memories
display_step = 1

n_input = 784 # MNIST data input (img shape : 28*28)
n_classes = 10 # MNIST total classes (0-9 digits)

train_labels = mnist.train.labels.astype(np.float32)
test_labels = mnist.test.labels.astype(np.float32)

# Hidden Layer Parameters
n_hidden_layer = 256 # Layer number of features

In [68]:
# Weights and Biases
weights = {
    'hidden_layer': tf.Variable(tf.random_normal([n_input, n_hidden_layer])),
    'out' : tf.Variable(tf.random_normal([n_hidden_layer, n_classes]))
}
biases = {
    'hidden_layer': tf.Variable(tf.random_normal([n_hidden_layer])),
    'out' : tf.Variable(tf.random_normal([n_classes]))
}

save_file = './train_model.ckpt'
saver = tf.train.Saver()

In [69]:
# input
x = tf.placeholder("float", [None, n_input])
y = tf.placeholder("float", [None, n_classes])
x_flat = tf.reshape(x, [-1, n_input]) # put "-1" means create automatically with n_input

In [70]:
# Hidden_layer with ReLU activation 
layer_1 = tf.add(tf.matmul(x_flat, weights['hidden_layer']), biases['hidden_layer'])
layer_1 = tf.nn.relu(layer_1)
# output layer with linear activation
logits = tf.add(tf.matmul(layer_1, weights['out']), biases['out'])

In [71]:
# Optimizer
# Define loss and optimizer
cost = tf.reduce_mean(tf.nn.softmax_cross_entropy_with_logits(logits=logits, labels=y))
optimizer = tf.train.GradientDescentOptimizer(learning_rate=learning_rate).minimize(cost)

# Calculate accuracy
correct_prediction = tf.equal(tf.argmax(logits, 1), tf.argmax(y, 1))
accuracy = tf.reduce_mean(tf.cast(correct_prediction, tf.float32))

In [73]:
# Session
# initialize the variables
init = tf.global_variables_initializer()

# Launch the gragh
with tf.Session() as sess:
    sess.run(init)
    # Training cycle
    for epoch in range(training_epochs):
        total_batch = int(mnist.train.num_examples/batch_size)
        # Loop over all batches
        for i in range(total_batch):
            batch_x, batch_y = mnist.train.next_batch(batch_size)
            # Run optimization op (backprop) and cost op (to get loss value)
            sess.run(optimizer, feed_dict = {x: batch_x, y: batch_y})
        # Print status for every 10 epochs
        if epoch % 5 == 0:
            valid_accuracy = sess.run(accuracy, feed_dict={x: test_features, y: test_labels})
            print('Epoch {:<3} - Validation Accuracy: {}'.format(epoch, valid_accuracy))
    # Save the model
    saver.save(sess, save_file)
    print('Trained Model Saved.')
            
    # Calculate accuracy for test dataset
    test_accuracy = sess.run(accuracy, feed_dict={x: test_features, y: test_labels})
    
print('Test Accuracy: {}'.format(test_accuracy))

Epoch 0   - Validation Accuracy: 0.3774000108242035
Epoch 5   - Validation Accuracy: 0.7282999753952026
Epoch 10  - Validation Accuracy: 0.7912999987602234
Epoch 15  - Validation Accuracy: 0.8212000131607056
Trained Model Saved.
Test Accuracy: 0.8330000042915344


In [74]:
# Launch the graph
with tf.Session() as sess:
    saver.restore(sess, save_file)

    test_accuracy = sess.run(
        accuracy,
        feed_dict={x: test_features, y: test_labels})

print('Test Accuracy: {}'.format(test_accuracy))

INFO:tensorflow:Restoring parameters from ./train_model.ckpt
Test Accuracy: 0.8330000042915344
