In [1]:
%config Completer.use_jedi = False

In [2]:
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Conv2D, MaxPooling2D, Activation, Flatten, Dense, AveragePooling2D
import tensorflow as tf
from tensorflow.keras.datasets import mnist
from tensorflow import keras
from sklearn.model_selection import train_test_split

import matplotlib.pyplot as plt
import numpy as np

In [3]:
(train_X, train_y), (testData, testLabels) = mnist.load_data()

In [4]:
print("Train Data shape : ", train_X.shape)
print("Train Labels shape : ", train_y.shape)
print("Test Data shape : ", testData.shape)
print("Test Labels shape : ", testLabels.shape)

Train Data shape :  (60000, 28, 28)
Train Labels shape :  (60000,)
Test Data shape :  (10000, 28, 28)
Test Labels shape :  (10000,)


In [5]:
trainData, valData, trainLabels, valLabels = train_test_split(train_X, train_y, test_size=0.10, random_state=42)

In [6]:
# reshape image dimensions
trainData = trainData.reshape(trainData.shape[0], 28, 28, 1)
valData = valData.reshape(valData.shape[0], 28, 28, 1)
testData = testData.reshape(testData.shape[0], 28, 28, 1)

In [7]:
print("Train Data shape : ", trainData.shape)
print("Validation Data shape : ", valData.shape)
print("Test Data shape : ", testData.shape)

Train Data shape :  (54000, 28, 28, 1)
Validation Data shape :  (6000, 28, 28, 1)
Test Data shape :  (10000, 28, 28, 1)


In [8]:
# Normalization
trainData = tf.keras.utils.normalize(trainData, axis=1)
valData = tf.keras.utils.normalize(valData, axis=1)
testData = tf.keras.utils.normalize(testData, axis=1)

In [9]:
trainData[0].shape

(28, 28, 1)

In [10]:
# Le-net 5 model building
leNet_model = Sequential()
leNet_model.add(Conv2D(filters=6, kernel_size=5, strides=1, activation='tanh', input_shape=trainData[0].shape, padding='valid'))
leNet_model.add(AveragePooling2D())
leNet_model.add(Conv2D(filters=16, kernel_size=5, strides=1, activation='tanh', padding='valid'))
leNet_model.add(AveragePooling2D())
leNet_model.add(Flatten())
leNet_model.add(Dense(120, activation='tanh'))
leNet_model.add(Dense(84, activation='tanh'))
leNet_model.add(Dense(10, activation='softmax'))

In [11]:
leNet_model.summary()

Model: "sequential"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
conv2d (Conv2D)              (None, 24, 24, 6)         156       
_________________________________________________________________
average_pooling2d (AveragePo (None, 12, 12, 6)         0         
_________________________________________________________________
conv2d_1 (Conv2D)            (None, 8, 8, 16)          2416      
_________________________________________________________________
average_pooling2d_1 (Average (None, 4, 4, 16)          0         
_________________________________________________________________
flatten (Flatten)            (None, 256)               0         
_________________________________________________________________
dense (Dense)                (None, 120)               30840     
_________________________________________________________________
dense_1 (Dense)              (None, 84)                1

In [12]:
leNet_model.compile(loss=keras.losses.sparse_categorical_crossentropy, optimizer=keras.optimizers.Adam(), metrics=['accuracy'])

In [13]:
leNet_model.fit(trainData, trainLabels, epochs=20, validation_data=(valData, valLabels))

Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


<tensorflow.python.keras.callbacks.History at 0x196cb0a3308>

In [14]:
predictions = leNet_model.predict(testData)

In [15]:
predictions

array([[3.1413783e-10, 1.7321423e-10, 1.7648553e-09, ..., 1.0000000e+00,
        1.1271797e-11, 2.6377860e-08],
       [4.5325072e-07, 1.7737767e-06, 9.9982798e-01, ..., 2.2952524e-11,
        1.6663519e-04, 2.7868188e-10],
       [1.0670389e-12, 9.9999976e-01, 4.9654841e-10, ..., 5.0112586e-10,
        2.4474770e-07, 6.0192677e-11],
       ...,
       [1.8703439e-13, 1.6395212e-10, 1.3257401e-11, ..., 5.6091814e-08,
        1.2083430e-07, 1.2439435e-07],
       [8.1436455e-11, 1.5543168e-10, 5.7920587e-12, ..., 3.4488583e-09,
        2.6257699e-06, 3.4405302e-11],
       [8.6808355e-10, 3.1768383e-09, 4.5228146e-10, ..., 7.4440318e-13,
        1.0878789e-08, 6.0387789e-12]], dtype=float32)

In [16]:
print(np.argmax(predictions[0]))

7


In [17]:
score = leNet_model.evaluate(testData, testLabels)



In [19]:
print('Test loss: {:.3f} %'.format(score[0] * 100))
print('Test accuracy: {:.3f} %'.format(score[1] * 100))

Test loss: 7.313 %
Test accuracy: 98.200 %
