# Classifying MNIST Database Using Convolutional Neural Networks with Keras

## Import Keras and Packages


In [9]:
#!pip install numpy==1.21.4
#!pip install pandas==1.3.4
!pip install keras==3.4.1



In [10]:
import keras
from keras.models import Sequential
from keras.layers import Dense
from keras.utils import to_categorical

In [11]:
from keras.layers import Conv2D # to add convolutional layers
from keras.layers import MaxPooling2D # to add pooling layers
from keras.layers import Flatten # to flatten data for fully connected layers

## Convolutional Network with One Set of Convolutional and Pooling Layers


In [12]:
# the MNIST loader lives in keras.datasets
from keras.datasets import mnist

# load the predefined train/test split as (images, labels) pairs
(X_train, y_train), (X_test, y_test) = mnist.load_data()

# add a trailing axis of size 1 so each array is [samples][rows][cols][channels],
# matching the (28, 28, 1) input shape the models below declare; cast to float32
X_train = X_train.reshape(-1, 28, 28, 1).astype('float32')
X_test = X_test.reshape(-1, 28, 28, 1).astype('float32')

In [13]:
# divide both image arrays by 255 (the largest 8-bit pixel value) so inputs lie in [0, 1]
# NOTE: rebinding the same names means re-running this cell alone scales the data again
X_train, X_test = X_train / 255, X_test / 255

In [14]:
# one-hot encode the label vectors for use with categorical cross-entropy
y_train, y_test = to_categorical(y_train), to_categorical(y_test)

# the width of the one-hot matrix is the number of categories
num_classes = y_test.shape[-1]

In [15]:
def convolutional_model():
    """Build and compile a CNN with one convolution + max-pooling stage.

    Layer stack: 16 filters of size 5x5 (stride 1, ReLU) over a 28x28x1
    input, 2x2 max pooling with stride 2, flatten, a 100-unit ReLU dense
    layer, and a softmax output layer with ``num_classes`` units.

    Reads the module-level ``num_classes``.

    Returns:
        A ``Sequential`` model compiled with the Adam optimizer,
        categorical cross-entropy loss and the accuracy metric.
    """
    model = Sequential([
        # Declare the input with an explicit Input object: Keras 3 warns when
        # `input_shape` is passed to the first layer of a Sequential model.
        keras.Input(shape=(28, 28, 1)),
        Conv2D(16, (5, 5), strides=(1, 1), activation='relu'),
        MaxPooling2D(pool_size=(2, 2), strides=(2, 2)),
        Flatten(),
        Dense(100, activation='relu'),
        Dense(num_classes, activation='softmax'),
    ])

    # compile model
    model.compile(optimizer='adam', loss='categorical_crossentropy', metrics=['accuracy'])
    return model

Finally, let's call the function to create the model, and then let's train it and evaluate it.


In [16]:
# instantiate a freshly compiled network
model = convolutional_model()

# train for 10 epochs in mini-batches of 200; the test split is passed as
# validation data, so its loss/accuracy are reported after every epoch
model.fit(
    X_train,
    y_train,
    validation_data=(X_test, y_test),
    epochs=10,
    batch_size=200,
    verbose=2,
)

# scores[1] is the accuracy metric requested at compile time (a fraction);
# the error is reported as a percentage
scores = model.evaluate(X_test, y_test, verbose=0)
print("Accuracy: {} \n Error: {}".format(scores[1], 100-scores[1]*100))

  super().__init__(activity_regularizer=activity_regularizer, **kwargs)


Epoch 1/10
300/300 - 26s - 88ms/step - accuracy: 0.9153 - loss: 0.2999 - val_accuracy: 0.9662 - val_loss: 0.1142
Epoch 2/10
300/300 - 23s - 77ms/step - accuracy: 0.9757 - loss: 0.0862 - val_accuracy: 0.9788 - val_loss: 0.0653
Epoch 3/10
300/300 - 40s - 134ms/step - accuracy: 0.9833 - loss: 0.0580 - val_accuracy: 0.9845 - val_loss: 0.0499
Epoch 4/10
300/300 - 21s - 69ms/step - accuracy: 0.9859 - loss: 0.0456 - val_accuracy: 0.9869 - val_loss: 0.0423
Epoch 5/10
300/300 - 22s - 73ms/step - accuracy: 0.9892 - loss: 0.0368 - val_accuracy: 0.9864 - val_loss: 0.0414
Epoch 6/10
300/300 - 40s - 135ms/step - accuracy: 0.9911 - loss: 0.0302 - val_accuracy: 0.9866 - val_loss: 0.0397
Epoch 7/10
300/300 - 40s - 134ms/step - accuracy: 0.9928 - loss: 0.0250 - val_accuracy: 0.9869 - val_loss: 0.0386
Epoch 8/10
300/300 - 22s - 73ms/step - accuracy: 0.9931 - loss: 0.0224 - val_accuracy: 0.9866 - val_loss: 0.0388
Epoch 9/10
300/300 - 20s - 68ms/step - accuracy: 0.9948 - loss: 0.0180 - val_accuracy: 0.9876

## Convolutional Network with Multiple Sets of Convolutional and Pooling Layers


In [17]:
def convolutional_model():
    """Build and compile a CNN with three convolution + max-pooling stages.

    Layer stack, in order: Conv2D(16, 5x5) -> MaxPool(2x2) -> Dense(100)
    -> Conv2D(8, 2x2) -> MaxPool(2x2) -> Dense(200) -> Conv2D(8, 2x2)
    -> MaxPool(2x2) -> Flatten -> Dense(300) -> Dense(num_classes, softmax).
    Every layer except the output uses ReLU.

    Reads the module-level ``num_classes``. This definition reuses the name
    of the single-stage builder earlier in the notebook, so running this
    cell replaces that function.

    Returns:
        A ``Sequential`` model compiled with the Adam optimizer,
        categorical cross-entropy loss and the accuracy metric.
    """
    model = Sequential()

    # Declare the input with an explicit Input object: Keras 3 warns when
    # `input_shape` is passed to the first layer of a Sequential model.
    model.add(keras.Input(shape=(28, 28, 1)))

    # stage 1
    model.add(Conv2D(16, (5, 5), activation='relu'))
    model.add(MaxPooling2D(pool_size=(2, 2), strides=(2, 2)))
    # NOTE(review): this Dense layer (and the Dense(200) below) receives the
    # un-flattened feature maps; per the Keras docs, Dense then acts along the
    # last axis only, i.e. on the channels at each spatial position. Confirm
    # that this is intended rather than a dense layer after Flatten.
    model.add(Dense(100, activation='relu'))

    # stage 2
    model.add(Conv2D(8, (2, 2), activation='relu'))
    model.add(MaxPooling2D(pool_size=(2, 2), strides=(2, 2)))

    # stage 3
    model.add(Dense(200, activation='relu'))
    model.add(Conv2D(8, (2, 2), activation='relu'))
    model.add(MaxPooling2D(pool_size=(2, 2), strides=(2, 2)))

    # classifier head
    model.add(Flatten())
    model.add(Dense(300, activation='relu'))
    model.add(Dense(num_classes, activation='softmax'))

    # Compile model
    model.compile(optimizer='adam', loss='categorical_crossentropy', metrics=['accuracy'])
    return model

Now, let's call the function to create our new convolutional neural network, and then let's train it and evaluate it.


In [20]:
# instantiate the multi-stage network defined above
model = convolutional_model()

# same training schedule as before: 10 epochs, mini-batches of 200, with the
# test split passed as validation data for per-epoch reporting
model.fit(
    X_train,
    y_train,
    validation_data=(X_test, y_test),
    epochs=10,
    batch_size=200,
    verbose=2,
)

# scores[1] is the accuracy metric requested at compile time (a fraction);
# the error is reported as a percentage
scores = model.evaluate(X_test, y_test, verbose=0)
print("Accuracy: {} \n Error: {}".format(scores[1], 100-scores[1]*100))

Epoch 1/10
300/300 - 64s - 212ms/step - accuracy: 0.8235 - loss: 0.5410 - val_accuracy: 0.9488 - val_loss: 0.1654
Epoch 2/10
300/300 - 60s - 198ms/step - accuracy: 0.9574 - loss: 0.1366 - val_accuracy: 0.9680 - val_loss: 0.1004
Epoch 3/10
300/300 - 80s - 267ms/step - accuracy: 0.9693 - loss: 0.0991 - val_accuracy: 0.9730 - val_loss: 0.0838
Epoch 4/10
300/300 - 81s - 271ms/step - accuracy: 0.9737 - loss: 0.0819 - val_accuracy: 0.9805 - val_loss: 0.0642
Epoch 5/10
300/300 - 82s - 273ms/step - accuracy: 0.9773 - loss: 0.0735 - val_accuracy: 0.9800 - val_loss: 0.0607
Epoch 6/10
300/300 - 81s - 271ms/step - accuracy: 0.9804 - loss: 0.0614 - val_accuracy: 0.9829 - val_loss: 0.0521
Epoch 7/10
300/300 - 83s - 278ms/step - accuracy: 0.9825 - loss: 0.0552 - val_accuracy: 0.9848 - val_loss: 0.0507
Epoch 8/10
300/300 - 81s - 271ms/step - accuracy: 0.9837 - loss: 0.0508 - val_accuracy: 0.9848 - val_loss: 0.0491
Epoch 9/10
300/300 - 78s - 260ms/step - accuracy: 0.9850 - loss: 0.0467 - val_accuracy: 