# Simple CNN for MNIST


## Setup

In [2]:
import numpy as np
from tensorflow import keras
from tensorflow.keras import layers
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Conv2D, Flatten, Dropout, Dense, MaxPooling2D

## Prepare the data

In [3]:
# Model / data parameters
num_classes = 10
input_shape = (28, 28, 1)

# Load the data and split it between train and test sets
(x_train, y_train), (x_test, y_test) = keras.datasets.mnist.load_data()

# Scale images to the [0, 1] range
x_train = x_train.astype("float32") / 255
x_test = x_test.astype("float32") / 255
# Make sure images have shape (28, 28, 1)
x_train = np.expand_dims(x_train, -1)
x_test = np.expand_dims(x_test, -1)
print("x_train shape:", x_train.shape)
print(x_train.shape[0], "train samples")
print(x_test.shape[0], "test samples")


# convert class vectors to binary class matrices
y_train = keras.utils.to_categorical(y_train, num_classes)
y_test = keras.utils.to_categorical(y_test, num_classes)

Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/mnist.npz
x_train shape: (60000, 28, 28, 1)
60000 train samples
10000 test samples


## Build the model

In [11]:
model = keras.Sequential(
    [
        # To-do
        keras.Input(shape=input_shape),  # Define the input shape of the model
        # Add a convolutional layer with 8 filters and ReLU activation
        Conv2D(filters = 8,kernel_size = (3,3), activation = 'relu'),
        MaxPooling2D(pool_size = (2,2)),# Add a max pooling layer with pool size 2x2
        Conv2D(filters = 16, kernel_size = (3,3), activation = 'relu'),# Add another convolutional layer with 16 filters and ReLU activation
        MaxPooling2D(pool_size = (3,3)),# Add another max pooling layer with pool size 2x2
        Flatten(),# Flatten the 2D feature maps into a 1D vector
        Dropout(0.5),# Apply dropout regularization with a rate of 0.5
        Dense(units = num_classes, activation = 'softmax')# Add a dense (fully connected) layer with softmax activation for classification
    ]
)

model.summary()

Model: "sequential_1"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 conv2d_5 (Conv2D)           (None, 26, 26, 8)         80        
                                                                 
 max_pooling2d_3 (MaxPoolin  (None, 13, 13, 8)         0         
 g2D)                                                            
                                                                 
 conv2d_6 (Conv2D)           (None, 11, 11, 16)        1168      
                                                                 
 max_pooling2d_4 (MaxPoolin  (None, 3, 3, 16)          0         
 g2D)                                                            
                                                                 
 flatten_1 (Flatten)         (None, 144)               0         
                                                                 
 dropout_1 (Dropout)         (None, 144)              

## Train the model

In [12]:
batch_size = 128  # Number of samples per gradient update
epochs = 15  # Number of times to iterate over the entire training dataset

# Configure the model for training
model.compile(loss="categorical_crossentropy", optimizer="adam", metrics=["accuracy"])

# Train the model on the training data
model.fit(x_train, y_train, batch_size=batch_size, epochs=epochs, validation_split=0.1)
# x_train: input training data
# y_train: target training data
# batch_size: number of samples per gradient update
# epochs: number of times to iterate over the entire training dataset
# validation_split: the fraction of the training data to be used as validation data during training


Epoch 1/15
Epoch 2/15
Epoch 3/15
Epoch 4/15
Epoch 5/15
Epoch 6/15
Epoch 7/15
Epoch 8/15
Epoch 9/15
Epoch 10/15
Epoch 11/15
Epoch 12/15
Epoch 13/15
Epoch 14/15
Epoch 15/15


<keras.src.callbacks.History at 0x7909f8ca4670>

## Evaluate the trained model

In [13]:
score = model.evaluate(x_test, y_test, verbose=0)
print("Test accuracy:", score[1])

Test accuracy: 0.9776999950408936
