In [4]:
# Importing necessary libraries
from keras.datasets import mnist
from keras.models import Sequential
from keras.layers import Dense, Dropout, Flatten
from keras.layers import Conv2D, MaxPooling2D
from keras.callbacks import EarlyStopping
from tensorflow.keras.utils import to_categorical
from sklearn.metrics import classification_report, confusion_matrix

In [5]:
# Loading the MNIST dataset
(x_train, y_train), (x_test, y_test) = mnist.load_data()

Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/mnist.npz


In [6]:
# Reshaping the data to match the input shape expected by the model
x_train = x_train.reshape(x_train.shape[0], 28, 28, 1)
x_test = x_test.reshape(x_test.shape[0], 28, 28, 1)
input_shape = (28, 28, 1)

In [7]:
# Setting some hyperparameters
batch_size = 128
num_classes = 10
epochs = 10

In [8]:
# Converting labels to categorical (one-hot encoding)
y_train = to_categorical(y_train, num_classes)
y_test = to_categorical(y_test, num_classes)

In [9]:
# Normalizing pixel values to be between 0 and 1
x_train = x_train.astype('float32')
x_test = x_test.astype('float32')
x_train /= 255
x_test /= 255
print('x_train shape:', x_train.shape)
print(x_train.shape[0], 'train samples')
print(x_test.shape[0], 'test samples')

x_train shape: (60000, 28, 28, 1)
60000 train samples
10000 test samples


In [10]:
# Creating the neural network model
model = Sequential()
model.add(Conv2D(32, kernel_size=(3, 3), activation='relu', input_shape=input_shape))
model.add(Conv2D(64, (3, 3), activation='relu'))
model.add(MaxPooling2D(pool_size=(2, 2)))
model.add(Dropout(0.25))
model.add(Flatten())
model.add(Dense(256, activation='relu'))
model.add(Dropout(0.5))
model.add(Dense(num_classes, activation='softmax'))

# Compiling the model
model.compile(optimizer='adadelta', loss='categorical_crossentropy', metrics=['accuracy'])

# Adding early stopping for model training
early_stopping = EarlyStopping(monitor='val_loss', patience=3)

In [11]:
# Training the model
hist = model.fit(x_train, y_train, batch_size=batch_size, epochs=epochs, verbose=1, validation_data=(x_test, y_test), callbacks=[early_stopping])

# Saving the trained model
model.save('mnist.h5')
print("Saving the model as mnist.h5")

Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
Saving the model as mnist.h5


  saving_api.save_model(


In [12]:
# Evaluating the model on the test data
score = model.evaluate(x_test, y_test, verbose=0)
print('Test loss:', score[0])
print('Test accuracy:', score[1])

Test loss: 0.6699315905570984
Test accuracy: 0.8508999943733215


In [14]:
import numpy as np
y_pred = model.predict(x_test)
y_pred_classes = np.argmax(y_pred, axis=1)
y_true = np.argmax(y_test, axis=1)

# Classification Report
print("Classification Report:")
print(classification_report(y_true, y_pred_classes))

# Confusion Matrix
confusion_mtx = confusion_matrix(y_true, y_pred_classes)
print("Confusion Matrix:")
print(confusion_mtx)

Classification Report:
              precision    recall  f1-score   support

           0       0.89      0.95      0.92       980
           1       0.88      0.96      0.91      1135
           2       0.89      0.85      0.87      1032
           3       0.80      0.89      0.84      1010
           4       0.83      0.80      0.82       982
           5       0.92      0.64      0.76       892
           6       0.86      0.91      0.89       958
           7       0.91      0.85      0.88      1028
           8       0.80      0.79      0.80       974
           9       0.76      0.84      0.80      1009

    accuracy                           0.85     10000
   macro avg       0.85      0.85      0.85     10000
weighted avg       0.85      0.85      0.85     10000

Confusion Matrix:
[[ 934    0    1    3    0    2   21    1   18    0]
 [   0 1087   19   10    1    1    5    0    9    3]
 [  17    9  873   13   17    1   33   21   46    2]
 [   4    7   30  894    0   15    4   15