In [1]:
import sys
import keras
from keras.models import Sequential
from keras.layers import Dense
from keras.utils import to_categorical
from keras.layers.convolutional import Conv2D # to add convolutional layers
from keras.layers.convolutional import MaxPooling2D # to add pooling layers
from keras.layers import Flatten # to flatten data for fully connected layers
# import data
from keras.datasets import mnist

Using TensorFlow backend.


In [2]:
# load data
(X_train, y_train), (X_test, y_test) = mnist.load_data()
print(X_train.shape, X_test.shape)
# (60000, 28, 28) (10000, 28, 28)

# reshape to [samples][height][width][channels]; the images are grayscale,
# so a single trailing channel axis is added (matches input_shape=(28, 28, 1))
X_train = X_train.reshape(X_train.shape[0], 28, 28, 1).astype('float32')
X_test = X_test.reshape(X_test.shape[0], 28, 28, 1).astype('float32')

# scale pixel values by 1/255
X_train = X_train / 255 # normalize training data
X_test = X_test / 255 # normalize test data

# Fix the number of categories once, from the raw integer labels of both
# splits, and pass it explicitly: to_categorical otherwise infers the width
# per call, so train and test could end up with different one-hot sizes if a
# class were missing from one split.
num_classes = int(max(y_train.max(), y_test.max())) + 1 # number of categories
y_train = to_categorical(y_train, num_classes)
y_test = to_categorical(y_test, num_classes)

def convolutional_model(input_shape=(28, 28, 1), n_classes=None):
    """Build and compile a small convolutional classifier.

    Architecture: Conv2D(64 filters, 5x5 kernel, stride 1, ReLU) ->
    MaxPooling2D(2x2, stride 2) -> Flatten -> Dense(100, ReLU) ->
    Dense(n_classes, softmax).

    Parameters
    ----------
    input_shape : tuple of int, optional
        Shape of a single input sample, forwarded to the first layer.
        Defaults to (28, 28, 1).
    n_classes : int, optional
        Width of the softmax output layer. When omitted, the notebook-level
        ``num_classes`` variable is used, so calling the function with no
        arguments behaves as before.

    Returns
    -------
    Sequential
        The model, compiled with the 'adam' optimizer,
        'categorical_crossentropy' loss and the 'accuracy' metric.
    """
    if n_classes is None:
        # Backward-compatible fallback to the notebook-level global.
        n_classes = num_classes

    # create model
    model = Sequential()
    model.add(Conv2D(64, (5, 5), strides=(1, 1), activation='relu', input_shape=input_shape))
    model.add(MaxPooling2D(pool_size=(2, 2), strides=(2, 2)))
    model.add(Flatten())
    model.add(Dense(100, activation='relu'))
    model.add(Dense(n_classes, activation='softmax'))
    # compile model
    model.compile(optimizer='adam', loss='categorical_crossentropy', metrics=['accuracy'])
    return model

# build the model
# Instantiate the compiled CNN and print its layer-by-layer summary as a
# sanity check before training.
model = convolutional_model()
model.summary()

Downloading data from https://s3.amazonaws.com/img-datasets/mnist.npz
(60000, 28, 28) (10000, 28, 28)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
conv2d_1 (Conv2D)            (None, 24, 24, 64)        1664      
_________________________________________________________________
max_pooling2d_1 (MaxPooling2 (None, 12, 12, 64)        0         
_________________________________________________________________
flatten_1 (Flatten)          (None, 9216)              0         
_________________________________________________________________
dense_1 (Dense)              (None, 100)               921700    
_________________________________________________________________
dense_2 (Dense)              (None, 10)                1010      
Total params: 924,374
Trainable params: 924,374
Non-trainable params: 0
_________________________________________________________________


In [None]:
# Training hyperparameters, named so they are easy to find and tune.
EPOCHS = 10
BATCH_SIZE = 200

# fit the model
# NOTE: the test split is also passed as validation data, so the per-epoch
# val_* numbers and the final score below are computed on the same images.
# That is fine for monitoring, but do not tune hyperparameters against them;
# hold out part of the training set for that instead.
model.fit(X_train, y_train, validation_data=(X_test, y_test),
          epochs=EPOCHS, batch_size=BATCH_SIZE, verbose=2)

# evaluate the model
scores = model.evaluate(X_test, y_test, verbose=0)
# scores[1] is the accuracy as a fraction in [0, 1]; index 0 holds the loss.
test_accuracy = scores[1]
# Report accuracy and error in the same unit (percent) with fixed precision,
# instead of mixing a fraction with a percentage and leaking float noise.
print("Accuracy: {:.2%}\nError: {:.2%}".format(test_accuracy, 1 - test_accuracy))

Train on 60000 samples, validate on 10000 samples
Epoch 1/10
 - 57s - loss: 0.2237 - acc: 0.9366 - val_loss: 0.0654 - val_acc: 0.9799
Epoch 2/10
 - 62s - loss: 0.0610 - acc: 0.9823 - val_loss: 0.0488 - val_acc: 0.9844
Epoch 3/10
 - 81s - loss: 0.0424 - acc: 0.9869 - val_loss: 0.0385 - val_acc: 0.9875
Epoch 4/10
 - 82s - loss: 0.0318 - acc: 0.9904 - val_loss: 0.0433 - val_acc: 0.9862
Epoch 5/10
 - 67s - loss: 0.0254 - acc: 0.9923 - val_loss: 0.0335 - val_acc: 0.9891
Epoch 6/10
 - 64s - loss: 0.0194 - acc: 0.9942 - val_loss: 0.0335 - val_acc: 0.9894
Epoch 7/10
 - 64s - loss: 0.0150 - acc: 0.9954 - val_loss: 0.0339 - val_acc: 0.9887
Epoch 8/10
 - 64s - loss: 0.0108 - acc: 0.9969 - val_loss: 0.0364 - val_acc: 0.9885
Epoch 9/10
 - 70s - loss: 0.0099 - acc: 0.9970 - val_loss: 0.0328 - val_acc: 0.9897
Epoch 10/10
Accuracy: 0.9877 
 Error: 1.230000000000004
