In [71]:
import numpy as np
import tensorflow as tf
from keras.datasets import mnist
from keras.models import Sequential
from keras.layers import Dense
from keras.layers import Dropout
from keras.layers import Flatten
from keras import activations
from keras.layers.convolutional import Convolution2D
from keras.layers.convolutional import MaxPooling2D
from keras.utils import np_utils
from keras import backend as K

In [72]:
# Fix the random seed for reproducibility.
# NumPy is imported as `np` in the import cell, so the generator must be
# reached through that alias (the bare name `numpy` is not defined).
# NOTE(review): this seeds NumPy's global RNG only; Keras weight
# initialisation and dropout presumably draw from TensorFlow's own
# generator -- consider also calling tf.random.set_seed(seed). TODO confirm.
seed = 7
np.random.seed(seed)

In [73]:
# Fetch the MNIST train/test splits, then unpack each into images and labels.
train_split, test_split = mnist.load_data()
X_train, y_train = train_split
X_test, y_test = test_split
# Display the shape of the training images as the cell output.
X_train.shape

(60000, 28, 28)

In [74]:
# Reshape to [samples][rows][cols][channels] (a single trailing channel,
# matching the model's input_shape of (28, 28, 1)), cast to float32, and
# normalize inputs from 0-255 to 0-1 in the same expression.
# -1 lets NumPy infer the sample count, which equals the original shape[0].
X_train = X_train.reshape(-1, 28, 28, 1).astype(np.float32) / 255
X_test = X_test.reshape(-1, 28, 28, 1).astype(np.float32) / 255

In [75]:
# One-hot encode the integer class labels.
# The class count is derived once from the training labels and passed to both
# calls, so the train and test matrices are guaranteed to have the same width
# even if one split happens not to contain the highest label (without
# `num_classes`, to_categorical infers the width from each array's own max).
num_classes = int(y_train.max()) + 1
y_train = np_utils.to_categorical(y_train, num_classes=num_classes)
y_test = np_utils.to_categorical(y_test, num_classes=num_classes)

In [76]:
# define a simple CNN model
def baseline_model(input_shape=(28, 28, 1), n_classes=None):
    """Build the (uncompiled) baseline CNN classifier.

    Layers, in order: 3x3 convolution with 32 feature maps (ReLU),
    2x2 max pooling, dropout with rate 0.2, flatten, a 128-unit ReLU dense
    layer, and a softmax output layer.

    Args:
        input_shape: Shape of a single input sample, without the batch axis.
            Defaults to (28, 28, 1), the value that used to be hard-coded.
        n_classes: Number of units in the softmax output layer. When None
            (the default), the notebook-level ``num_classes`` is used, so a
            plain ``baseline_model()`` call behaves exactly as before.

    Returns:
        The Sequential model. It is not compiled; the caller does that.
    """
    if n_classes is None:
        # Fall back to the module-level value for backward compatibility.
        n_classes = num_classes

    # create model
    model = Sequential()
    # 32 feature maps with filter size 3x3
    model.add(Convolution2D(32, (3, 3), input_shape=input_shape, activation='relu'))
    model.add(MaxPooling2D(pool_size=(2, 2)))
    model.add(Dropout(0.2))
    model.add(Flatten())
    model.add(Dense(128, activation='relu'))
    model.add(Dense(n_classes, activation='softmax'))
    return model

# Instantiate the baseline network with its default settings.
model = baseline_model()
# Configure training: Adam optimizer, categorical cross-entropy loss,
# and accuracy reported as the tracked metric.
model.compile(
    optimizer='adam',
    loss='categorical_crossentropy',
    metrics=['accuracy'],
)

In [78]:
# Train for 10 epochs in mini-batches of 200 samples; the test split is passed
# as validation data so its loss/accuracy are reported after every epoch.
# verbose=2 prints one summary line per epoch.
model.fit(
    X_train,
    y_train,
    validation_data=(X_test, y_test),
    epochs=10,
    batch_size=200,
    verbose=2,
)

Epoch 1/10
300/300 - 13s - loss: 0.2745 - accuracy: 0.9212 - val_loss: 0.0985 - val_accuracy: 0.9716 - 13s/epoch - 45ms/step
Epoch 2/10
300/300 - 13s - loss: 0.0872 - accuracy: 0.9746 - val_loss: 0.0664 - val_accuracy: 0.9802 - 13s/epoch - 44ms/step
Epoch 3/10
300/300 - 13s - loss: 0.0610 - accuracy: 0.9816 - val_loss: 0.0495 - val_accuracy: 0.9831 - 13s/epoch - 44ms/step
Epoch 4/10
300/300 - 14s - loss: 0.0471 - accuracy: 0.9855 - val_loss: 0.0461 - val_accuracy: 0.9847 - 14s/epoch - 46ms/step
Epoch 5/10
300/300 - 14s - loss: 0.0377 - accuracy: 0.9882 - val_loss: 0.0405 - val_accuracy: 0.9858 - 14s/epoch - 47ms/step
Epoch 6/10
300/300 - 13s - loss: 0.0333 - accuracy: 0.9894 - val_loss: 0.0492 - val_accuracy: 0.9847 - 13s/epoch - 44ms/step
Epoch 7/10
300/300 - 16s - loss: 0.0267 - accuracy: 0.9916 - val_loss: 0.0409 - val_accuracy: 0.9865 - 16s/epoch - 53ms/step
Epoch 8/10
300/300 - 15s - loss: 0.0228 - accuracy: 0.9929 - val_loss: 0.0383 - val_accuracy: 0.9871 - 15s/epoch - 48ms/step


<keras.callbacks.History at 0x1a81fb30a60>

In [None]:
# Score the trained model on the test split (silently) and report the error.
scores = model.evaluate(X_test, y_test, verbose=0)
# scores[1] is the 'accuracy' metric requested at compile time; convert it
# to an error percentage.
error_pct = 100 - scores[1] * 100
print("CNN Error: %.2f%%" % error_pct)