In [1]:
import numpy
from keras.datasets import mnist
from keras.models import Sequential
from keras.layers import Dense
from keras.layers import Dropout
from keras.layers import Flatten
from keras.layers.convolutional import Convolution2D
from keras.layers.convolutional import MaxPooling2D
from keras.utils import np_utils
from keras import backend as K

# Fix the random seed for reproducibility.
# NOTE(review): only NumPy's global RNG is seeded here; whether that covers
# every source of randomness used by the Keras backend is not visible from
# this notebook -- confirm for the installed version.
seed = 7
numpy.random.seed(seed)

Using TensorFlow backend.


In [2]:
# Fetch the MNIST train/test splits.
(X_train, y_train), (X_test, y_test) = mnist.load_data()

# Give every split the shape (samples, 28, 28, 1): a trailing single-channel
# axis is appended and -1 lets NumPy infer the sample count. The pixels are
# then cast to float32.
X_train = X_train.reshape((-1, 28, 28, 1)).astype('float32')
X_test = X_test.reshape((-1, 28, 28, 1)).astype('float32')

In [3]:
# Rescale pixel intensities from the 0-255 range into 0-1.
X_train, X_test = X_train / 255, X_test / 255

# One-hot encode both label vectors; the width of the encoded test labels
# is taken as the number of classes.
y_train, y_test = (np_utils.to_categorical(labels) for labels in (y_train, y_test))
num_classes = y_test.shape[1]

In [4]:
def baseline_model():
    """Build and compile the single-convolution baseline CNN.

    Layer stack, in order: Convolution2D(32, 5, 5) with ReLU over inputs of
    shape (28, 28, 1), 2x2 max pooling, Dropout(0.2), flatten, a 128-unit
    ReLU dense layer and a softmax output layer with ``num_classes`` units.

    ``num_classes`` is read from the notebook's global scope, so it must be
    defined before this function is called.

    Returns:
        The compiled ``Sequential`` model (categorical cross-entropy loss,
        'adam' optimizer, accuracy metric).
    """
    layers = [
        Convolution2D(32, 5, 5, border_mode='valid', input_shape=(28, 28, 1), activation='relu'),
        MaxPooling2D(pool_size=(2, 2)),
        Dropout(0.2),
        Flatten(),
        Dense(128, activation='relu'),
        Dense(num_classes, activation='softmax'),
    ]
    model = Sequential(layers)

    model.compile(
        loss='categorical_crossentropy',
        optimizer='adam',
        metrics=['accuracy']
    )
    return model

In [5]:
# Instantiate the baseline network.
model = baseline_model()

# Train for 10 epochs with batches of 200 samples. The test split is also
# passed as validation data, so the per-epoch val_* figures are measured on
# the same samples as the final evaluation below.
model.fit(
    X_train,
    y_train,
    validation_data=(X_test, y_test),
    nb_epoch=10,
    batch_size=200,
    verbose=2
)

# Score the trained model on the test split and report the second entry of
# the returned scores as an error percentage.
scores = model.evaluate(X_test, y_test, verbose=0)
print("Baseline Error: %.2f%%" % (100-scores[1]*100))

Train on 60000 samples, validate on 10000 samples
Epoch 1/10
23s - loss: 0.2520 - acc: 0.9272 - val_loss: 0.0861 - val_acc: 0.9748
Epoch 2/10
22s - loss: 0.0767 - acc: 0.9770 - val_loss: 0.0631 - val_acc: 0.9796
Epoch 3/10
23s - loss: 0.0553 - acc: 0.9825 - val_loss: 0.0488 - val_acc: 0.9835
Epoch 4/10
23s - loss: 0.0423 - acc: 0.9875 - val_loss: 0.0403 - val_acc: 0.9872
Epoch 5/10
23s - loss: 0.0346 - acc: 0.9893 - val_loss: 0.0349 - val_acc: 0.9886
Epoch 6/10
23s - loss: 0.0288 - acc: 0.9909 - val_loss: 0.0350 - val_acc: 0.9886
Epoch 7/10
23s - loss: 0.0233 - acc: 0.9927 - val_loss: 0.0339 - val_acc: 0.9884
Epoch 8/10
24s - loss: 0.0192 - acc: 0.9939 - val_loss: 0.0351 - val_acc: 0.9888
Epoch 9/10
23s - loss: 0.0174 - acc: 0.9940 - val_loss: 0.0320 - val_acc: 0.9888
Epoch 10/10
23s - loss: 0.0133 - acc: 0.9957 - val_loss: 0.0332 - val_acc: 0.9898
Baseline Error: 1.02%


In [6]:
def larger_model():
    """Build and compile the deeper two-convolution CNN.

    Layer stack, in order: Convolution2D(30, 5, 5) with ReLU over inputs of
    shape (28, 28, 1), 2x2 max pooling, Convolution2D(15, 3, 3) with ReLU,
    2x2 max pooling, Dropout(0.2), flatten, ReLU dense layers of 128 and 50
    units, and a softmax output layer with ``num_classes`` units.

    ``num_classes`` is read from the notebook's global scope, so it must be
    defined before this function is called.

    Returns:
        The compiled ``Sequential`` model (categorical cross-entropy loss,
        'adam' optimizer, accuracy metric).
    """
    layers = [
        Convolution2D(30, 5, 5, border_mode='valid', input_shape=(28, 28, 1), activation='relu'),
        MaxPooling2D(pool_size=(2, 2)),
        Convolution2D(15, 3, 3, activation='relu'),
        MaxPooling2D(pool_size=(2, 2)),
        Dropout(0.2),
        Flatten(),
        Dense(128, activation='relu'),
        Dense(50, activation='relu'),
        Dense(num_classes, activation='softmax'),
    ]
    model = Sequential(layers)

    model.compile(
        loss='categorical_crossentropy',
        optimizer='adam',
        metrics=['accuracy']
    )
    return model

In [7]:
# Instantiate the larger network (this rebinds `model`, replacing whatever
# it previously referred to).
model = larger_model()

# Train for 10 epochs with batches of 200 samples. The test split is also
# passed as validation data, so the per-epoch val_* figures are measured on
# the same samples as the final evaluation below.
model.fit(
    X_train,
    y_train,
    validation_data=(X_test, y_test),
    nb_epoch=10,
    batch_size=200,
    verbose=2
)

# Score the trained model on the test split and report the second entry of
# the returned scores as an error percentage. The label names the larger
# CNN so this result is not mistaken for the baseline's.
scores = model.evaluate(X_test, y_test, verbose=0)
print("Large CNN Error: %.2f%%" % (100-scores[1]*100))

Train on 60000 samples, validate on 10000 samples
Epoch 1/10
27s - loss: 0.4038 - acc: 0.8777 - val_loss: 0.0859 - val_acc: 0.9725
Epoch 2/10
27s - loss: 0.0989 - acc: 0.9699 - val_loss: 0.0508 - val_acc: 0.9830
Epoch 3/10
28s - loss: 0.0693 - acc: 0.9792 - val_loss: 0.0390 - val_acc: 0.9873
Epoch 4/10
27s - loss: 0.0601 - acc: 0.9812 - val_loss: 0.0340 - val_acc: 0.9881
Epoch 5/10
27s - loss: 0.0484 - acc: 0.9847 - val_loss: 0.0306 - val_acc: 0.9903
Epoch 6/10
27s - loss: 0.0441 - acc: 0.9858 - val_loss: 0.0283 - val_acc: 0.9910
Epoch 7/10
27s - loss: 0.0396 - acc: 0.9875 - val_loss: 0.0373 - val_acc: 0.9886
Epoch 8/10
29s - loss: 0.0368 - acc: 0.9878 - val_loss: 0.0263 - val_acc: 0.9920
Epoch 9/10
28s - loss: 0.0307 - acc: 0.9902 - val_loss: 0.0272 - val_acc: 0.9915
Epoch 10/10
28s - loss: 0.0304 - acc: 0.9904 - val_loss: 0.0242 - val_acc: 0.9918
Baseline Error: 0.82%
