In [12]:
################ 5.0 Loading the MNIST dataset in Keras #####################
from keras.datasets import mnist
from keras import models
from keras import layers
from keras.utils import to_categorical

## mnist.load_data() returns a pair of (images, labels) tuples: the training split first, then the test split.
_train_split, _test_split = mnist.load_data()
train_images, train_labels = _train_split
test_images, test_labels = _test_split

################ 5.1 Instantiating a small convnet ################################

model = models.Sequential()

## Convolutional base: Conv2D and MaxPool2D layers alternate.
## Conv2D(output_depth, (window_height, window_width)):
##   - output_depth is the number of filters, i.e. the channel count of the output feature map
##   - (3, 3) is the size of the patches extracted from the input
## A 3 x 3 convolution without padding trims one pixel from every border, so the first layer
## turns the (28, 28, 1) input into a (26, 26, 32) feature map.
## MaxPool2D((2, 2)) slides a 2 x 2 window (with stride 2) over every channel and keeps only the
## maximum of each window. Like a convolution it works on local patches, but the transformation is a
## fixed `max` instead of a learned linear one; its job is to aggressively downsample the feature map
## by a factor of 2.
## Resulting feature-map sizes: 28 -> 26 -> 13 -> 11 -> 5 -> 3, with depths 32, 32, 64, 64, 64.
conv_base = [
    layers.Conv2D(32, (3, 3), activation='relu', input_shape=(28, 28, 1)),
    layers.MaxPool2D((2, 2)),
    layers.Conv2D(64, (3, 3), activation='relu'),
    layers.MaxPool2D((2, 2)),
    layers.Conv2D(64, (3, 3), activation='relu'),
]
for conv_layer in conv_base:
    model.add(conv_layer)

# model.summary()

################ 5.2 Adding a classifier on top of the convnet #####################

## The (3, 3, 64) output of the convolutional base is flattened into a vector of 576 values and fed
## to a small densely connected classifier; the final 10-way softmax yields one probability per digit.
classifier_head = [
    layers.Flatten(),
    layers.Dense(64, activation='relu'),
    layers.Dense(10, activation='softmax'),
]
for head_layer in classifier_head:
    model.add(head_layer)

# model.summary()


################ 5.3 Training the convnet on MNIST images #####################

## Add the trailing channel axis required by the first Conv2D layer (input_shape=(28, 28, 1)) and
## rescale the pixel values by 1/255. Using -1 lets NumPy infer the number of samples instead of
## hard-coding 60000 / 10000, so the same code also works on a subset of the data.
## Both splits are cast to float32: the original test split used 'float' (float64), which was
## inconsistent with the training split and doubled the memory of the test images for no benefit.
train_images = train_images.reshape((-1, 28, 28, 1)).astype('float32') / 255
test_images = test_images.reshape((-1, 28, 28, 1)).astype('float32') / 255

## One-hot encode the integer digit labels for use with a categorical cross-entropy loss.
## num_classes is pinned to 10 so the encoding always matches the 10-unit softmax output,
## even if a split (or a subset of it) happens not to contain the digit 9.
train_labels = to_categorical(train_labels, num_classes=10)
test_labels = to_categorical(test_labels, num_classes=10)

# model.compile(optimizer='rmsprop', loss='categorical_crossentropy', metrics=['accuracy'])

# model.fit(train_images, train_labels, batch_size=65, epochs=5)

# test_loss, test_acc = model.evaluate(test_images, test_labels)

# test_acc

_________________________________________________________________
Layer (type)                 Output Shape              Param #   
conv2d_16 (Conv2D)           (None, 26, 26, 32)        320       
_________________________________________________________________
max_pooling2d_11 (MaxPooling (None, 13, 13, 32)        0         
_________________________________________________________________
conv2d_17 (Conv2D)           (None, 11, 11, 64)        18496     
_________________________________________________________________
max_pooling2d_12 (MaxPooling (None, 5, 5, 64)          0         
_________________________________________________________________
conv2d_18 (Conv2D)           (None, 3, 3, 64)          36928     
Total params: 55,744
Trainable params: 55,744
Non-trainable params: 0
_________________________________________________________________
