In [1]:
import tensorflow.keras as keras

# MNIST Example Network
Example code that builds, trains, and evaluates a small convolutional neural network (CNN) on the MNIST handwritten-digit dataset.

In [2]:
from tensorflow.keras.layers import Input, Conv2D, MaxPooling2D, Flatten, Dense, GlobalAveragePooling2D
from tensorflow.keras.models import Model

# Toggle 2x2 max pooling after the first two convolution stages.
# NOTE(review): with use_max_pooling=True the spatial size appears to shrink
# 28 -> 13 -> 6 -> 2 -> 1 before the final 3x3 'valid' convolution, which
# would leave no room for the kernel -- confirm before enabling.
use_max_pooling = False

# One entry per convolution stage:
#   (filters, strides, dilation_rate, pooling slot follows this stage?)
# Every stage uses a 3x3 kernel, 'valid' padding and a ReLU activation.
conv_stages = (
    (32, (2, 2), 1, True),   # strided conv
    (64, 1,      2, True),   # dilated conv
    (64, 1,      1, False),  # plain conv, no pooling slot afterwards
)

# Functional-API graph: 28x28 single-channel images in, conv feature map out.
inputTensor = Input(shape=(28, 28, 1))
currentTensor = inputTensor

for n_filters, stride, dilation, has_pool_slot in conv_stages:
    currentTensor = Conv2D(filters=n_filters,
                           kernel_size=(3, 3),
                           strides=stride,
                           padding='valid',
                           dilation_rate=dilation,
                           activation='relu')(currentTensor)
    if has_pool_slot and use_max_pooling:
        currentTensor = MaxPooling2D(pool_size=(2, 2))(currentTensor)

# Wrap the backbone in a temporary model just to inspect the layer shapes.
model = Model(inputTensor, currentTensor)
model.summary()

Model: "model"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 input_1 (InputLayer)        [(None, 28, 28, 1)]       0         
                                                                 
 conv2d (Conv2D)             (None, 13, 13, 32)        320       
                                                                 
 conv2d_1 (Conv2D)           (None, 9, 9, 64)          18496     
                                                                 
 conv2d_2 (Conv2D)           (None, 7, 7, 64)          36928     
                                                                 
Total params: 55,744
Trainable params: 55,744
Non-trainable params: 0
_________________________________________________________________


In [3]:
# Choose how the conv feature map is collapsed before classification:
#   True  -> global average pooling, then a 32-unit hidden layer
#   False -> flatten, then a 64-unit hidden layer
use_gap = True

# Build the head under its own name instead of rebinding `currentTensor`.
# `currentTensor` keeps pointing at the conv feature map from the previous
# cell, so this cell can be re-run (e.g. after flipping `use_gap`) without
# stacking a second head on top of the previous softmax output.
headTensor = currentTensor

if not use_gap:
    headTensor = Flatten()(headTensor)
    headTensor = Dense(units=64, activation='relu')(headTensor)
else:
    headTensor = GlobalAveragePooling2D()(headTensor)
    headTensor = Dense(units=32, activation='relu')(headTensor)

# 10-way softmax: one probability per digit class.
outputTensor = Dense(units=10, activation='softmax')(headTensor)

# Full classifier: image input -> conv backbone -> head -> class probabilities.
model = Model(inputTensor, outputTensor)
model.summary()

Model: "model_1"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 input_1 (InputLayer)        [(None, 28, 28, 1)]       0         
                                                                 
 conv2d (Conv2D)             (None, 13, 13, 32)        320       
                                                                 
 conv2d_1 (Conv2D)           (None, 9, 9, 64)          18496     
                                                                 
 conv2d_2 (Conv2D)           (None, 7, 7, 64)          36928     
                                                                 
 global_average_pooling2d (G  (None, 64)               0         
 lobalAveragePooling2D)                                          
                                                                 
 dense (Dense)               (None, 32)                2080      
                                                           

In [4]:
from tensorflow.keras.datasets import mnist
from tensorflow.keras.utils import to_categorical

# Fetch the MNIST train/test splits as (images, labels) pairs.
(train_images, train_labels), (test_images, test_labels) = mnist.load_data()

# Add the trailing channel axis the network's Input layer expects, cast to
# float32 and divide by 255 (presumably mapping 8-bit pixel values into
# [0, 1] -- see the Keras MNIST dataset docs).
train_images = train_images.reshape((60000, 28, 28, 1)).astype('float32') / 255
test_images = test_images.reshape((10000, 28, 28, 1)).astype('float32') / 255

# Convert the integer class labels to the categorical (one-hot) encoding.
train_labels, test_labels = (
    to_categorical(train_labels),
    to_categorical(test_labels),
)

In [5]:
# Configure training: RMSprop optimizer, categorical cross-entropy loss
# (labels were encoded with to_categorical), and accuracy as the metric.
model.compile(loss='categorical_crossentropy',
              optimizer='rmsprop',
              metrics=['accuracy'])

# Train for 5 passes over the training set in mini-batches of 64.
# Left as the last expression so the returned History object is displayed.
model.fit(x=train_images, y=train_labels, batch_size=64, epochs=5)

Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


<keras.callbacks.History at 0x7ff63040e9a0>

In [6]:
# Score the trained model on the held-out test split; the result unpacks into
# the loss followed by the single metric ('accuracy') set in model.compile.
(test_loss, test_acc) = model.evaluate(x=test_images, y=test_labels)



In [7]:
# Display the test-set accuracy returned by model.evaluate in the previous cell.
test_acc

0.9807000160217285