**Import Packages**

In [None]:
import tensorflow as tf
from tensorflow.keras import datasets, layers, models
import numpy as np
import matplotlib.pyplot as plt

**Load Data**

In [None]:
# Download (or read from the local Keras cache) the MNIST train/test splits.
(train_images, train_labels), (test_images, test_labels) = datasets.mnist.load_data()

# Scale pixel values into [0, 1], then append a trailing channel axis so each
# image has shape (28, 28, 1), which is what the Conv2D layers expect.
train_images = (train_images / 255.0).reshape(train_images.shape[0], 28, 28, 1)
test_images = (test_images / 255.0).reshape(test_images.shape[0], 28, 28, 1)

# Sanity check: one shape per line, training split first.
print(train_images.shape, test_images.shape, sep="\n")

**Plot Examples**

In [None]:
# Preview the first 25 training images in a 5x5 grid, each captioned with
# its label.
fig, axes = plt.subplots(5, 5, figsize=(10, 10))
for idx, ax in enumerate(axes.flat):
    # Hide ticks and grid lines; they carry no information for an image tile.
    ax.set_xticks([])
    ax.set_yticks([])
    ax.grid(False)
    # Drop the channel axis: imshow wants a 2-D array for a single-channel image.
    ax.imshow(train_images[idx][:, :, 0])
    ax.set_xlabel(train_labels[idx])
plt.show()

**Build (partial) Model and Display the Architecture (Convolutional Layers)**

In [None]:
# Convolutional feature extractor: Conv(28 filters) -> MaxPool -> Conv(56 filters).
model = models.Sequential()

# Declare the input shape with an explicit Input object instead of passing
# `input_shape=` to the first layer. Newer Keras releases warn about the
# layer-argument form; the Input form is accepted by older TF 2.x as well.
model.add(layers.Input(shape=(28, 28, 1)))
model.add(layers.Conv2D(28, 3, activation='relu'))
model.add(layers.MaxPooling2D((2, 2)))
model.add(layers.Conv2D(56, 3, activation='relu'))

# Show the partial architecture before the dense layers are attached.
model.summary()

**Build Fully Connected (FC) Layers and Display the Architecture**

In [None]:
# Classification head appended to the existing `model`:
#   Flatten   - collapses the convolutional feature maps into a vector
#   Dense(56) - hidden fully connected layer with ReLU
#   Dense(10) - output layer; no activation, so it emits raw scores (logits)
# NOTE: this cell mutates `model`; re-running it without first re-running the
# cell that creates `model` stacks a second head on top.
for head_layer in (
    layers.Flatten(),
    layers.Dense(56, activation='relu'),
    layers.Dense(10),
):
    model.add(head_layer)

# Show the complete architecture.
model.summary()

**Training the Model**

In [None]:
# Training hyperparameters, named so they are easy to find and tune.
BATCH_SIZE = 64
EPOCHS = 5

# The output layer has no activation, so the loss is told to expect logits
# (from_logits=True). Labels are integer class ids, hence the "sparse" variant.
model.compile(optimizer='adam',
              loss=tf.keras.losses.SparseCategoricalCrossentropy(from_logits=True),
              metrics=['accuracy'])

# Background: the basic Stochastic Gradient Descent update rule is
#
#     θ = θ - η * ∇J(x, y)
#
#         theta θ:            a network parameter (e.g. a weight w)
#         eta η:              the learning rate
#         gradient ∇J(x, y):  the gradient of the objective function,
#                             i.e. the change for a specific theta θ
#
# The optimizer configured above is Adam, not plain SGD. Adam builds on this
# rule by scaling each parameter's step with running estimates of the
# gradient's first and second moments.

# NOTE: validation_data is the test split, so the val_* curves are measured on
# the same images as any later evaluation on test_images/test_labels; they are
# not an independent hold-out estimate.
history = model.fit(train_images, train_labels,
                    batch_size=BATCH_SIZE,
                    epochs=EPOCHS,
                    validation_data=(test_images, test_labels))

**Show Final Results**

In [None]:
# Per-epoch accuracy curves recorded by model.fit: training vs. validation.
for metric_name in ('accuracy', 'val_accuracy'):
    plt.plot(history.history[metric_name], label=metric_name)
plt.xlabel('Epoch')
plt.ylabel('Accuracy')
# Clip the y-axis to [0.5, 1] so differences between the curves stay visible.
plt.ylim(0.5, 1)
plt.legend(loc='lower right')

# Final loss and accuracy on the test split.
test_loss, test_acc = model.evaluate(test_images, test_labels, verbose=2)

print("test accuracy: {:.4f}".format(test_acc))