In [1]:
from keras import layers
from keras import models


Using TensorFlow backend.
  return f(*args, **kwds)


In [2]:
# Convolutional base: three 3x3 convolutions (32, 64, 64 filters), with a 2x2
# max-pooling step after each of the first two. Input is 28x28 with 1 channel.
model = models.Sequential([
    layers.Conv2D(filters=32, kernel_size=(3, 3), activation='relu',
                  input_shape=(28, 28, 1)),
    layers.MaxPooling2D(pool_size=(2, 2)),
    layers.Conv2D(filters=64, kernel_size=(3, 3), activation='relu'),
    layers.MaxPooling2D(pool_size=(2, 2)),
    layers.Conv2D(filters=64, kernel_size=(3, 3), activation='relu'),
])

In [3]:
# Print the per-layer table of output shapes and parameter counts.
model.summary()

_________________________________________________________________
Layer (type)                 Output Shape              Param #   
conv2d_1 (Conv2D)            (None, 26, 26, 32)        320       
_________________________________________________________________
max_pooling2d_1 (MaxPooling2 (None, 13, 13, 32)        0         
_________________________________________________________________
conv2d_2 (Conv2D)            (None, 11, 11, 64)        18496     
_________________________________________________________________
max_pooling2d_2 (MaxPooling2 (None, 5, 5, 64)          0         
_________________________________________________________________
conv2d_3 (Conv2D)            (None, 3, 3, 64)          36928     
Total params: 55,744
Trainable params: 55,744
Non-trainable params: 0
_________________________________________________________________


The next step is to feed the output of the last convolutional layer, a tensor of shape (3, 3, 64), into a densely connected classifier network.

Classifiers process 1D vectors, whereas the current output is a 3D tensor. So the output first needs to be flattened to 1D, and then a few Dense layers are added on top.

In [4]:
# Classifier head: flatten the conv output to a vector, pass it through a
# 64-unit ReLU layer, and finish with a 10-way softmax output layer.
model.add(layers.Flatten())
model.add(layers.Dense(units=64, activation='relu'))
model.add(layers.Dense(units=10, activation='softmax'))
model.summary()

_________________________________________________________________
Layer (type)                 Output Shape              Param #   
conv2d_1 (Conv2D)            (None, 26, 26, 32)        320       
_________________________________________________________________
max_pooling2d_1 (MaxPooling2 (None, 13, 13, 32)        0         
_________________________________________________________________
conv2d_2 (Conv2D)            (None, 11, 11, 64)        18496     
_________________________________________________________________
max_pooling2d_2 (MaxPooling2 (None, 5, 5, 64)          0         
_________________________________________________________________
conv2d_3 (Conv2D)            (None, 3, 3, 64)          36928     
_________________________________________________________________
flatten_1 (Flatten)          (None, 576)               0         
_________________________________________________________________
dense_1 (Dense)              (None, 64)                36928     
__________

# Load the MNIST images

In [5]:
from keras.datasets import mnist
from keras.utils import to_categorical

# load_data() returns two (images, labels) pairs, unpacked here as the
# training split and the test split.
(train_images, train_labels), (test_images, test_labels) = mnist.load_data()

In [6]:
# Show the shapes of both image arrays before any reshaping.
# (A bare `type(train_images)` used to sit here; as it was not the last
# expression of the cell its value was discarded, so it has been removed.)
print(train_images.shape)
print(test_images.shape)
## page 122

(60000, 28, 28)
(10000, 28, 28)


In [7]:
# Add the trailing channel axis required by the model's
# input_shape=(28, 28, 1). Using -1 lets reshape infer the number of samples
# instead of hard-coding 60000, and keeps the cell safe to re-run.
train_images = train_images.reshape((-1, 28, 28, 1))
print(train_images.shape)

(60000, 28, 28, 1)


In [8]:
# Convert to float32 and divide by 255 (presumably mapping 8-bit pixel
# intensities into [0, 1]). The dtype guard makes the cell idempotent:
# re-running it will not divide already-converted data by 255 a second time.
if train_images.dtype != 'float32':
    train_images = train_images.astype('float32') / 255

In [9]:
print(test_images.shape)
# Add the trailing channel axis; -1 lets reshape infer the number of samples
# instead of hard-coding 10000.
test_images = test_images.reshape((-1, 28, 28, 1))
print(test_images.shape)
# Convert to float32 and divide by 255. The dtype guard keeps the cell
# idempotent, so re-running it does not scale the data twice.
if test_images.dtype != 'float32':
    test_images = test_images.astype('float32') / 255

# First training label, still a plain integer at this point.
print(train_labels[0])

(10000, 28, 28)
(10000, 28, 28, 1)
5


In [10]:
# to_categorical converts integer class labels into a binary (one-hot) class
# matrix, the target format used with the categorical_crossentropy loss.
# num_classes is fixed at 10 so that both matrices always have 10 columns,
# matching the Dense(10) output layer, instead of being inferred separately
# from the largest label present in each array.
train_labels = to_categorical(train_labels, num_classes=10)
test_labels = to_categorical(test_labels, num_classes=10)
print(train_labels[0])

[0. 0. 0. 0. 0. 1. 0. 0. 0. 0.]


In [11]:
# Configure training (rmsprop optimizer, categorical cross-entropy loss,
# accuracy metric), then train for 5 epochs with batches of 64 samples.
model.compile(
    loss='categorical_crossentropy',
    optimizer='rmsprop',
    metrics=['accuracy'],
)
model.fit(x=train_images, y=train_labels, batch_size=64, epochs=5)

Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


<keras.callbacks.History at 0x12460ff98>

In [12]:
# Evaluate the trained model on the test images and labels; the two returned
# values are unpacked as the loss and the accuracy metric.
test_loss, test_acc = model.evaluate(x=test_images, y=test_labels)



In [13]:
# NOTE(review): identical to the evaluate call in the previous cell; it re-runs
# the evaluation and overwrites test_loss / test_acc. Likely redundant.
test_loss, test_acc = model.evaluate(test_images, test_labels)




In [14]:
# Display the accuracy value returned by model.evaluate.
test_acc

0.9909

In [15]:
# Display the loss value returned by model.evaluate.
test_loss

0.03147862863912614