In [1]:
import keras
from keras.models import Sequential
from keras.layers import Dense
from keras.utils import to_categorical

When working with convolutional neural networks in particular, we need a few additional layer classes: convolution, pooling, and flatten.

In [2]:
from keras.layers.convolutional import Conv2D # to add convolutional layers
from keras.layers.convolutional import MaxPooling2D # to add pooling layers
from keras.layers import Flatten # to flatten data for fully connected layers

In [3]:
# import data
from keras.datasets import mnist

# load data: MNIST images plus their labels, already split into train/test
(X_train, y_train), (X_test, y_test) = mnist.load_data()

# reshape to be [samples][height][width][channels]; Conv2D needs an explicit
# trailing channel axis, and these images have a single channel.
# -1 lets NumPy infer the number of samples from the array itself.
X_train = X_train.reshape(-1, 28, 28, 1).astype('float32')
X_test = X_test.reshape(-1, 28, 28, 1).astype('float32')

Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/mnist.npz


Let's normalize the pixel values from the range 0–255 to the range 0–1.

In [4]:
# Divide both splits by 255 so pixel values land in [0, 1]
# (assumes the raw intensities top out at 255, as for 8-bit images).
# NOTE: running this cell twice rescales the data a second time.
X_train, X_test = X_train / 255, X_test / 255

Next, let's one-hot encode the target labels, turning each digit label into a binary class vector.


In [5]:
# Fix the number of classes once, from the raw integer labels of both splits,
# so train and test are encoded with the same width even if one split happens
# to be missing the highest label.
num_classes = int(max(y_train.max(), y_test.max())) + 1 # number of categories

# one-hot encode the labels using the shared class count
y_train = to_categorical(y_train, num_classes=num_classes)
y_test = to_categorical(y_test, num_classes=num_classes)

Define a function that creates our model. The convolutional model has two convolutional layers, each followed by a max-pooling layer.

In [6]:
def convolutional_model():
    """Build and compile the CNN classifier.

    Architecture: two Conv2D + MaxPooling2D stages (16 filters of 5x5, then
    8 filters of 2x2, each followed by 2x2 pooling with stride 2), flattened
    into a 100-unit ReLU dense layer and a softmax output layer. The output
    width is read from the module-level ``num_classes``.

    Returns:
        The compiled Sequential model (Adam optimizer, categorical
        cross-entropy loss, accuracy metric).
    """
    # Convolutional stages; the first layer declares the 28x28x1 input shape.
    feature_extractor = [
        Conv2D(16, (5, 5), activation='relu', input_shape=(28, 28, 1)),
        MaxPooling2D(pool_size=(2, 2), strides=(2, 2)),
        Conv2D(8, (2, 2), activation='relu'),
        MaxPooling2D(pool_size=(2, 2), strides=(2, 2)),
    ]
    # Fully connected head on top of the flattened feature maps.
    classifier_head = [
        Flatten(),
        Dense(100, activation='relu'),
        Dense(num_classes, activation='softmax'),
    ]

    network = Sequential(feature_extractor + classifier_head)
    network.compile(loss='categorical_crossentropy', optimizer='adam', metrics=['accuracy'])
    return network

Finally, let's call the function to create the model, and then let's train it and evaluate it.

In [7]:
# Instantiate and compile the CNN
model = convolutional_model()

# Train for 10 epochs in mini-batches of 200; the test split is passed as
# validation data, so its loss/accuracy are reported after every epoch
model.fit(
    X_train,
    y_train,
    batch_size=200,
    epochs=10,
    validation_data=(X_test, y_test),
    verbose=2,
)

# Score the trained model on the test split; scores[1] is read as the accuracy.
# Note the units: accuracy is printed as a fraction, error as a percentage.
scores = model.evaluate(X_test, y_test, verbose=0)
print("Accuracy: {} \n Error: {}".format(scores[1], 100 - scores[1] * 100))

Epoch 1/10
300/300 - 14s - loss: 0.4827 - accuracy: 0.8529 - val_loss: 0.1305 - val_accuracy: 0.9631 - 14s/epoch - 48ms/step
Epoch 2/10
300/300 - 14s - loss: 0.1184 - accuracy: 0.9648 - val_loss: 0.0818 - val_accuracy: 0.9742 - 14s/epoch - 45ms/step
Epoch 3/10
300/300 - 13s - loss: 0.0854 - accuracy: 0.9740 - val_loss: 0.0698 - val_accuracy: 0.9782 - 13s/epoch - 43ms/step
Epoch 4/10
300/300 - 13s - loss: 0.0678 - accuracy: 0.9794 - val_loss: 0.0553 - val_accuracy: 0.9829 - 13s/epoch - 44ms/step
Epoch 5/10
300/300 - 13s - loss: 0.0576 - accuracy: 0.9826 - val_loss: 0.0541 - val_accuracy: 0.9829 - 13s/epoch - 43ms/step
Epoch 6/10
300/300 - 13s - loss: 0.0499 - accuracy: 0.9847 - val_loss: 0.0428 - val_accuracy: 0.9861 - 13s/epoch - 43ms/step
Epoch 7/10
300/300 - 13s - loss: 0.0452 - accuracy: 0.9863 - val_loss: 0.0473 - val_accuracy: 0.9849 - 13s/epoch - 45ms/step
Epoch 8/10
300/300 - 13s - loss: 0.0406 - accuracy: 0.9874 - val_loss: 0.0401 - val_accuracy: 0.9869 - 13s/epoch - 43ms/step
