In [1]:
from keras import models, layers

Using TensorFlow backend.


In [2]:
# Convolutional feature extractor followed by a small dense classifier head,
# declared as one ordered list of layers.
model = models.Sequential([
    # 32 filters of size 3x3 applied to 28x28 single-channel inputs
    layers.Conv2D(32, (3, 3), activation='relu', input_shape=(28, 28, 1)),
    # 2x2 max pooling roughly halves each spatial dimension
    layers.MaxPooling2D((2, 2)),
    layers.Conv2D(64, (3, 3), activation='relu'),
    layers.MaxPooling2D((2, 2)),
    layers.Conv2D(64, (3, 3), activation='relu'),
    # Flatten the last Conv2D output so the Dense layers below can consume it
    layers.Flatten(),
    layers.Dense(64, activation='relu'),
    # One softmax output unit per class (10 classes)
    layers.Dense(10, activation='softmax'),
])


In [3]:
# Inspect the model structure: prints one row per layer with its output shape
# and parameter count.
model.summary()

_________________________________________________________________
Layer (type)                 Output Shape              Param #   
conv2d_1 (Conv2D)            (None, 26, 26, 32)        320       
_________________________________________________________________
max_pooling2d_1 (MaxPooling2 (None, 13, 13, 32)        0         
_________________________________________________________________
conv2d_2 (Conv2D)            (None, 11, 11, 64)        18496     
_________________________________________________________________
max_pooling2d_2 (MaxPooling2 (None, 5, 5, 64)          0         
_________________________________________________________________
conv2d_3 (Conv2D)            (None, 3, 3, 64)          36928     
_________________________________________________________________
flatten_1 (Flatten)          (None, 576)               0         
_________________________________________________________________
dense_1 (Dense)              (None, 64)                36928     
__________

In [4]:
# Import plot_model from the public `keras.utils` namespace rather than the
# internal `keras.utils.vis_utils` module path.
from keras.utils import plot_model

# Write a diagram of the model to a PNG file, annotating every layer with its
# name and tensor shapes.
plot_model(model, to_file='MNIST_CNN_plot.png', show_shapes=True, show_layer_names=True)

In [1]:
from keras.datasets import mnist

# load_data() yields an (images, labels) pair for the training split and a
# second (images, labels) pair for the test split.
(train_images, train_labels), (test_images, test_labels) = mnist.load_data()


Using TensorFlow backend.


In [3]:
# Peek at the first ten raw (integer) training labels
train_labels[:10]

array([5, 0, 4, 1, 9, 2, 1, 3, 1, 4], dtype=uint8)

In [4]:
# Add an explicit single-channel axis so each sample matches the model's
# (28, 28, 1) input shape. The sample count is inferred with -1 instead of
# being hard-coded, so the cell also works on a subset of the data.
train_images = train_images.reshape((-1, 28, 28, 1))
# Convert to float32 and divide by 255.
# NOTE: the names are overwritten, so running this cell twice divides by 255
# twice; re-run the data-loading cell first if this cell must be repeated.
train_images = train_images.astype('float32')/255

test_images = test_images.reshape((-1, 28, 28, 1))
test_images = test_images.astype('float32')/255

In [5]:
from keras.utils import to_categorical

# One-hot encode the integer labels. The class count is pinned to 10 (matching
# the 10-unit softmax output layer) so that both splits always get the same
# width, instead of each being inferred from the labels present in that split.
# NOTE: the names are overwritten, so run this cell only once per data load.
train_labels = to_categorical(train_labels, num_classes=10)
test_labels = to_categorical(test_labels, num_classes=10)

In [6]:
# Show the first training label after one-hot encoding
train_labels[0]

array([0., 0., 0., 0., 0., 1., 0., 0., 0., 0.], dtype=float32)

In [8]:
# Configure training: RMSprop optimizer, categorical cross-entropy loss for the
# one-hot labels, and accuracy reported as the metric.
model.compile(
    optimizer='rmsprop',
    loss='categorical_crossentropy',
    metrics=['accuracy'],
)

In [9]:
import time

# Time the training run with a monotonic, high-resolution clock;
# time.time() follows the wall clock and can jump if the system clock is
# adjusted while training is in progress.
start_time = time.perf_counter()
# Train for 5 passes over the training set in mini-batches of 64 samples
model.fit(train_images, train_labels, epochs=5, batch_size=64)
print("----- %s seconds ----- " % (time.perf_counter() - start_time ))

Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5
----- 75.57900166511536 seconds ----- 


In [21]:
# Evaluate the trained model on the test split; the result is unpacked into the
# loss and the accuracy metric requested at compile time.
test_loss, test_acc = model.evaluate(test_images, test_labels)



In [22]:
# Final accuracy on the test split, to be compared with the densely connected
# (Dense-layers-only) network.
# NOTE(review): the original note said "DenseNet"; presumably it meant a plain
# dense baseline rather than the DenseNet architecture — confirm.
test_acc

0.98950000000000005