In [1]:
import numpy as np
from tensorflow.keras.layers import Dense, Dropout, Input
from tensorflow.keras.datasets import mnist
from tensorflow.keras.layers import Conv2D, MaxPooling2D, Flatten
from tensorflow.keras.utils import to_categorical
from tensorflow.keras.models import Model

In [2]:
# Fetch MNIST through the Keras dataset helper and unpack the two splits
# it returns into image arrays (x_*) and label arrays (y_*).
train_split, test_split = mnist.load_data()
x_train, y_train = train_split
x_test, y_test = test_split

In [3]:
# inspect the training labels as loaded, before one-hot encoding
y_train

array([5, 0, 4, ..., 5, 6, 8], dtype=uint8)

In [4]:
# from sparse label to categorical (one-hot vector)
# num_labels is counted from the distinct training labels and is passed
# explicitly as the one-hot width for BOTH splits. Without num_classes,
# to_categorical infers the width from each array's own maximum value, so
# the two splits are not guaranteed to end up with the same number of columns.
# Assumes labels are the integers 0 .. num_labels-1 -- TODO confirm if the
# dataset is ever swapped for another one.
# NOTE: this cell overwrites y_train / y_test in place; re-run the data
# loading cell before re-running this one.
num_labels = len(np.unique(y_train))
y_train = to_categorical(y_train, num_classes=num_labels)
y_test = to_categorical(y_test, num_classes=num_labels)

In [5]:
# inspect the training labels again, now as one-hot rows
y_train

array([[0., 0., 0., ..., 0., 0., 0.],
       [1., 0., 0., ..., 0., 0., 0.],
       [0., 0., 0., ..., 0., 0., 0.],
       ...,
       [0., 0., 0., ..., 0., 0., 0.],
       [0., 0., 0., ..., 0., 0., 0.],
       [0., 0., 0., ..., 0., 1., 0.]], dtype=float32)

In [6]:
# Give every image an explicit trailing channel axis, then convert to
# float32 and divide by 255.
# NOTE: x_train / x_test are overwritten in place, so re-running this cell
# without reloading the data would divide by 255 a second time.
image_size = x_train.shape[1]
image_dims = [-1, image_size, image_size, 1]
x_train = x_train.reshape(image_dims).astype('float32') / 255
x_test = x_test.reshape(image_dims).astype('float32') / 255

In [7]:
# Hyperparameters used by the model-building, training and evaluation cells.
kernel_size = 3     # kernel size passed to every Conv2D layer
filters = 64        # number of filters passed to every Conv2D layer
dropout = 0.3       # rate passed to the Dropout layer
batch_size = 128    # batch size for both fit() and evaluate()
input_shape = (image_size, image_size, 1)   # shape given to the Input layer

In [8]:
# Assemble the CNN with the Keras functional API.

# Every convolution uses the same settings, so keep them in one place.
conv_args = dict(filters=filters,
                 kernel_size=kernel_size,
                 activation='relu')

inputs = Input(shape=input_shape)

# Two Conv2D -> MaxPooling2D stages followed by a final Conv2D.
y = inputs
for _stage in range(2):
    y = Conv2D(**conv_args)(y)
    y = MaxPooling2D()(y)
y = Conv2D(**conv_args)(y)

# Flatten the feature maps into a vector before connecting to the Dense
# layer, applying dropout regularization in between.
y = Flatten()(y)
y = Dropout(dropout)(y)

# Softmax classifier with one output unit per label.
outputs = Dense(num_labels, activation='softmax')(y)

# Build the model from its input and output tensors.
model = Model(inputs=inputs, outputs=outputs)

# Print a text summary of the network.
model.summary()

Model: "model"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 input_1 (InputLayer)        [(None, 28, 28, 1)]       0         
                                                                 
 conv2d (Conv2D)             (None, 26, 26, 64)        640       
                                                                 
 max_pooling2d (MaxPooling2D  (None, 13, 13, 64)       0         
 )                                                               
                                                                 
 conv2d_1 (Conv2D)           (None, 11, 11, 64)        36928     
                                                                 
 max_pooling2d_1 (MaxPooling  (None, 5, 5, 64)         0         
 2D)                                                             
                                                                 
 conv2d_2 (Conv2D)           (None, 3, 3, 64)          36928 

In [9]:
# Configure training: Adam optimizer, categorical cross-entropy loss
# and accuracy as the reported metric.
model.compile(optimizer='adam',
              loss='categorical_crossentropy',
              metrics=['accuracy'])

In [10]:
# train the model
# Keep the History object returned by fit() in a variable: it stays
# available for later inspection, and the assignment stops the cell from
# echoing an object repr (with a memory address) as its output.
# NOTE(review): the test split is also passed as validation data, so the
# per-epoch validation metrics and the final test accuracy are computed
# on the same images.
history = model.fit(x_train, y_train,
                    validation_data=(x_test, y_test),
                    epochs=20,
                    batch_size=batch_size)

Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


<keras.callbacks.History at 0x2131ba37f70>

In [11]:
# Score the trained model on the test split without progress output.
# score[1] is read as the accuracy (the only metric passed to compile()).
score = model.evaluate(x_test, y_test, batch_size=batch_size, verbose=0)

accuracy_percent = 100 * score[1]
print("\nTest accuracy: %.1f%%" % accuracy_percent)


Test accuracy: 99.4%
