# Convolutional Network on Keras (MNIST)

Import libraries and modules

In [1]:
import numpy as np
# Fix the seed of NumPy's global random generator so NumPy-driven randomness
# repeats from run to run.
# NOTE(review): this call only touches NumPy; the Keras backend may keep its own
# random state that is not seeded here -- confirm if exact repeatability matters.
SEED = 123
np.random.seed(SEED)

In [2]:
from keras.models import Sequential
from keras.layers import Dense, Dropout, Activation, Flatten
from keras.layers import Conv2D, MaxPooling2D
from keras.utils import np_utils
from keras.datasets import mnist

Using TensorFlow backend.


Load pre-shuffled MNIST data into train and test sets, then preprocess the images and labels

In [3]:
# Load the MNIST train/test split bundled with Keras.
(X_train, y_train), (X_test, y_test) = mnist.load_data()

# Preprocess input data:
#   * append a trailing channel axis of size 1 (the image height/width are taken
#     from the loaded arrays instead of being hard-coded),
#   * convert to float32,
#   * divide by 255 so 8-bit pixel intensities are rescaled into [0, 1].
X_train = X_train.reshape(X_train.shape + (1,)).astype('float32') / 255
X_test = X_test.reshape(X_test.shape + (1,)).astype('float32') / 255

# Preprocess class labels: one-hot encode the integer digit labels into 10 columns.
Y_train = np_utils.to_categorical(y_train, 10)
Y_test = np_utils.to_categorical(y_test, 10)

# Sanity-check the resulting shapes. print() is called as a function so the cell
# runs on Python 3 as well as Python 2 (the printed text is the same on both).
print(X_train.shape)
print(Y_train.shape)

(60000, 28, 28, 1)
(60000, 10)


Define and compile the model architecture

In [4]:
# Small CNN: one 3x3 convolution stage with max-pooling and dropout, followed by
# a dense classifier head that ends in a 10-way softmax.
model = Sequential([
    Conv2D(32, (3, 3), activation='relu', input_shape=X_train.shape[1:]),
    # A second Conv2D(32, (3, 3), activation='relu') layer is left disabled here.
    MaxPooling2D(pool_size=(2, 2)),
    Dropout(0.25),
    Flatten(),
    Dense(128, activation='relu'),
    Dropout(0.5),
    Dense(10, activation='softmax'),
])

# Configure training: Adam optimizer, categorical cross-entropy loss (matching
# the one-hot labels), and accuracy reported as the metric.
model.compile(
    optimizer='adam',
    loss='categorical_crossentropy',
    metrics=['accuracy'],
)

Fit model on training data

In [5]:
# Train for a single pass over the training set in mini-batches of 64 samples.
# The call stays the last expression of the cell so its return value is displayed.
model.fit(
    x=X_train,
    y=Y_train,
    batch_size=64,
    epochs=1,
)

Epoch 1/1


<keras.callbacks.History at 0x7f523cb0e910>

Evaluate model on test data

In [6]:
# Score the trained model on the held-out test set without a progress bar.
# With the loss and the single 'accuracy' metric set in compile(), the displayed
# result is a two-element list: [loss, accuracy].
model.evaluate(x=X_test, y=Y_test, verbose=0)

[0.07614485906027257, 0.977]