In [14]:
from keras.models import Sequential
from keras.layers import Dense, Dropout, Flatten
from keras.layers.convolutional import Convolution2D, MaxPooling2D
from keras.utils import np_utils
import numpy as np


In [15]:
from keras.datasets import mnist
# Load the MNIST training and test splits as (inputs, labels) pairs.
(X_train, y_train), (X_test, y_test) = mnist.load_data()

In [16]:
# Check the raw training array's dimensions before any reshaping.
X_train.shape

(60000, 28, 28)

In [17]:
# Number of values in one image (rows * cols); baseline_model uses it as the
# width of its hidden Dense layer.
num_pixels = X_train.shape[1] * X_train.shape[2]
# Size of the channel axis that preprocess() inserts.
n_channels = 1
def preprocess(matrix):
    """Insert a channel axis and rescale the values by 1/255.

    Parameters
    ----------
    matrix : array with at least three axes (samples, rows, cols)
        Only the first three entries of ``matrix.shape`` are read.

    Returns
    -------
    float32 array of shape (samples, n_channels, rows, cols) whose values
    are the input values divided by 255.
    """
    dims = matrix.shape
    # Channel axis goes right after the sample axis.
    with_channel = matrix.reshape((dims[0], n_channels, dims[1], dims[2]))
    as_float = with_channel.astype('float32')
    return as_float / 255.

In [18]:
# Replace the raw image arrays with their reshaped, rescaled versions.
X_train = preprocess(X_train)
X_test = preprocess(X_test)

In [19]:
# Sanity check after preprocessing: shape, dtype and the largest value.
X_train.shape, X_train.dtype, np.max(X_train)

((60000, 1, 28, 28), dtype('float32'), 1.0)

In [20]:
# One-hot encode the integer labels. The class count is derived from the
# training labels and passed explicitly when encoding the test labels, so
# both label matrices are guaranteed to have the same number of columns
# (inferring it per split would give a narrower test matrix if the test
# labels happened to lack the highest class).
y_train = np_utils.to_categorical(y_train)
num_classes = y_train.shape[1]
y_test = np_utils.to_categorical(y_test, num_classes)

In [21]:
# Confirm the encoded labels are 2-D: one row per sample, one column per class.
y_train.shape

(60000, 10)

In [22]:
def baseline_model():
    """Build and compile the fully connected baseline classifier.

    Layers, in order: flatten the (1, 28, 28) input, a ReLU Dense layer with
    ``num_pixels`` units, and a softmax Dense layer with ``num_classes``
    units. Both Dense layers use the 'normal' initializer.

    Returns the ``Sequential`` model compiled with categorical
    cross-entropy loss, the Adam optimizer and the accuracy metric.
    """
    stack = [
        Flatten(input_shape=(1, 28, 28)),
        Dense(num_pixels, init='normal', activation='relu'),
        Dense(num_classes, init='normal', activation='softmax'),
    ]
    network = Sequential(stack)
    network.compile(loss='categorical_crossentropy',
                    optimizer='adam',
                    metrics=['accuracy'])
    return network

In [23]:
def convolution_small():
    """Build and compile a single-convolution classifier.

    Layers, in order: 32 filters of 5x5 ('valid' border, ReLU) on the
    (1, 28, 28) input, 2x2 max pooling, dropout of 0.2, flatten, a ReLU Dense
    layer with 128 units, and a softmax Dense layer with ``num_classes`` units.

    Returns the ``Sequential`` model compiled with categorical
    cross-entropy loss, the Adam optimizer and the accuracy metric.
    """
    stack = [
        Convolution2D(32, 5, 5, border_mode='valid', input_shape=(1, 28, 28), activation='relu'),
        MaxPooling2D(pool_size=(2, 2)),
        Dropout(0.2),
        Flatten(),
        Dense(128, activation='relu'),
        Dense(num_classes, activation='softmax'),
    ]
    network = Sequential(stack)
    network.compile(loss='categorical_crossentropy',
                    optimizer='adam',
                    metrics=['accuracy'])
    return network


In [25]:
def convolution_large():
    """Build and compile a two-convolution classifier.

    Layers, in order: 30 filters of 5x5 ('valid' border, ReLU) on the
    (1, 28, 28) input, 2x2 max pooling, 15 filters of 3x3 (ReLU), 2x2 max
    pooling, dropout of 0.2, flatten, ReLU Dense layers with 128 and 50
    units, and a softmax Dense layer with ``num_classes`` units.

    Returns the ``Sequential`` model compiled with categorical
    cross-entropy loss, the Adam optimizer and the accuracy metric.
    """
    stack = [
        Convolution2D(30, 5, 5, border_mode='valid', input_shape=(1, 28, 28), activation='relu'),
        MaxPooling2D(pool_size=(2, 2)),
        Convolution2D(15, 3, 3, activation='relu'),
        MaxPooling2D(pool_size=(2, 2)),
        Dropout(0.2),
        Flatten(),
        Dense(128, activation='relu'),
        Dense(50, activation='relu'),
        Dense(num_classes, activation='softmax'),
    ]
    network = Sequential(stack)
    network.compile(loss='categorical_crossentropy',
                    optimizer='adam',
                    metrics=['accuracy'])
    return network

In [120]:
# Build the three models, then train and score each one in turn.
# NumPy's global RNG is seeded before the models are constructed.
np.random.seed(101)
models = [('baseline', baseline_model()), 
          ('small', convolution_small()), 
          ('large', convolution_large())]

for name, model in models:
    print("With model:", name)
    # Fit the model.
    # NOTE: the test split is also passed as validation data, so the per-epoch
    # val_* figures and the final evaluation are computed on the same samples.
    model.fit(X_train, y_train, validation_data=(X_test, y_test), nb_epoch=10, batch_size=100, verbose=2)
    # Final evaluation of the model
    scores = model.evaluate(X_test, y_test, verbose=0)
    # scores[1] is the metric requested at compile time (accuracy); report its
    # complement under the model's own name rather than always "Baseline".
    print("%s Error: %.2f%%" % (name.capitalize(), 100-scores[1]*100))
    print()

With model: baseline
Train on 60000 samples, validate on 10000 samples
Epoch 1/10
3s - loss: 0.2332 - acc: 0.9313 - val_loss: 0.1113 - val_acc: 0.9670
Epoch 2/10
3s - loss: 0.0897 - acc: 0.9735 - val_loss: 0.0864 - val_acc: 0.9737
Epoch 3/10
3s - loss: 0.0559 - acc: 0.9829 - val_loss: 0.0682 - val_acc: 0.9792
Epoch 4/10
3s - loss: 0.0382 - acc: 0.9886 - val_loss: 0.0642 - val_acc: 0.9789
Epoch 5/10
2s - loss: 0.0270 - acc: 0.9919 - val_loss: 0.0617 - val_acc: 0.9802
Epoch 6/10
2s - loss: 0.0188 - acc: 0.9947 - val_loss: 0.0579 - val_acc: 0.9818
Epoch 7/10
3s - loss: 0.0143 - acc: 0.9962 - val_loss: 0.0650 - val_acc: 0.9805
Epoch 8/10
2s - loss: 0.0115 - acc: 0.9966 - val_loss: 0.0788 - val_acc: 0.9771
Epoch 9/10
2s - loss: 0.0107 - acc: 0.9970 - val_loss: 0.0829 - val_acc: 0.9766
Epoch 10/10
2s - loss: 0.0102 - acc: 0.9970 - val_loss: 0.0724 - val_acc: 0.9796
Baseline Error: 2.04%

With model: small
Train on 60000 samples, validate on 10000 samples
Epoch 1/10
17s - loss: 0.1878 - acc: 