In [1]:
import numpy as np
import keras
from keras import layers

In [10]:
# Model / data parameters
num_classes = 10
input_shape = (28, 28, 1)


def _to_model_input(images):
    """Return `images` as float32 divided by 255, with a trailing channel axis appended."""
    scaled = images.astype("float32") / 255  # scale pixel values to the [0, 1] range
    return scaled[..., np.newaxis]  # e.g. (60000, 28, 28) -> (60000, 28, 28, 1)


# Load MNIST, already split into train and test sets
(x_train, y_train), (x_test, y_test) = keras.datasets.mnist.load_data()

# Apply the same scaling and reshaping to both image sets
x_train = _to_model_input(x_train)
x_test = _to_model_input(x_test)

print("x_train shape:", x_train.shape)
print(len(x_train), "train samples")  ## number of train/test samples
print(len(x_test), "test samples")

# Convert the class vectors to binary class matrices.
# To visualize the conversion, print y_train before and after:
#print ("Before:", y_train)
y_train = keras.utils.to_categorical(y_train, num_classes=num_classes)
#print("After:", y_train)
y_test = keras.utils.to_categorical(y_test, num_classes=num_classes)

x_train shape: (60000, 28, 28, 1)
60000 train samples
10000 test samples


In [11]:
# Layers in forward order: two convolution + max-pooling stages, then a
# flattened, dropout-regularised softmax classifier over `num_classes` outputs.
cnn_layers = [
    keras.Input(shape=input_shape),
    layers.Conv2D(filters=32, kernel_size=(3, 3), activation="relu"),
    layers.MaxPooling2D(pool_size=(2, 2)),
    layers.Conv2D(filters=64, kernel_size=(3, 3), activation="relu"),
    layers.MaxPooling2D(pool_size=(2, 2)),
    layers.Flatten(),
    layers.Dropout(rate=0.5),
    layers.Dense(units=num_classes, activation="softmax"),
]
model = keras.Sequential(cnn_layers)

# Print the layer-by-layer summary of the assembled model
model.summary()

In [12]:
# Training hyperparameters
batch_size = 128
epochs = 15

# Categorical cross-entropy matches the one-hot labels produced by to_categorical
model.compile(
    optimizer="adam",
    loss="categorical_crossentropy",
    metrics=["accuracy"],
)

# Train, holding out a 0.1 fraction of the training data for validation.
# The call is left as the cell's last expression, so its return value is displayed.
model.fit(
    x=x_train,
    y=y_train,
    batch_size=batch_size,
    epochs=epochs,
    validation_split=0.1,
)

Epoch 1/15
422/422 ━━━━━━━━━━━━━━━━━━━━ 48s 111ms/step - accuracy: 0.7750 - loss: 0.7394 - val_accuracy: 0.9792 - val_loss: 0.0782
Epoch 2/15
422/422 ━━━━━━━━━━━━━━━━━━━━ 42s 99ms/step - accuracy: 0.9639 - loss: 0.1195 - val_accuracy: 0.9862 - val_loss: 0.0554
Epoch 3/15
422/422 ━━━━━━━━━━━━━━━━━━━━ 42s 99ms/step - accuracy: 0.9729 - loss: 0.0864 - val_accuracy: 0.9873 - val_loss: 0.0455
Epoch 4/15
422/422 ━━━━━━━━━━━━━━━━━━━━ 83s 102ms/step - accuracy: 0.9776 - loss: 0.0726 - val_accuracy: 0.9882 - val_loss: 0.0423
Epoch 5/15
422/422 ━━━━━━━━━━━━━━━━━━━━ 49s 116ms/step - accuracy: 0.9815 - loss: 0.0598 - val_accuracy: 0.9908 - val_loss: 0.0353
Epoch 6/15
422/422 ━━━━━━━━━━━━━━━━━━━━ 43s 101ms/step - accuracy: 0.9834 - loss: 0.0528 - val_accuracy: 0.9903 - val_loss: 0.0346
Epoch 7/15


<keras.src.callbacks.history.History at 0x7e09c4174c80>

In [14]:
# Persist the trained model to disk -- change the path as needed.
# NOTE(review): the ".h5" suffix presumably selects the HDF5 format; recent Keras
# releases recommend the native ".keras" format. Confirm nothing downstream
# expects "model.h5" before switching.
model.save(filepath="model.h5")



In [13]:
# Evaluate the model on the test samples; verbose=0 is passed to evaluate().
score = model.evaluate(x=x_test, y=y_test, verbose=0)

# The first two entries of `score` are reported as loss and accuracy
test_loss, test_accuracy = score[0], score[1]
print("Test loss:", test_loss)
print("Test accuracy:", test_accuracy)

Test loss: 0.026942122727632523
Test accuracy: 0.9908000230789185


Source: Keras example "Simple MNIST convnet" — https://keras.io/examples/vision/mnist_convnet/