# Simple MNIST convnet

**Author:** [fchollet](https://twitter.com/fchollet)<br>
**Date created:** 2015/06/19<br>
**Last modified:** 2020/04/21<br>
**Description:** A simple convnet that achieves ~99% test accuracy on MNIST.

## Setup

In [None]:
import numpy as np
import keras
from keras import layers

In [1]:
import os
import numpy as np
from tensorflow.keras.datasets import mnist
from PIL import Image

# Load MNIST data
(x_train, y_train), (x_test, y_test) = mnist.load_data()

# Base directory for saving images
base_dir = 'data'  # Update this path

os.makedirs(base_dir, exist_ok=True)

# Create subdirectories for train and test datasets
for split in ['train', 'test']:
    for i in range(10):  # There are 10 classes (0-9)
        os.makedirs(os.path.join(base_dir, split, str(i)), exist_ok=True)

# Function to save images
def save_images(images, labels, split):
    for idx, (image, label) in enumerate(zip(images, labels)):
        folder = os.path.join(base_dir, split, str(label))
        image_path = os.path.join(folder, f'{idx}.png')
        im = Image.fromarray(image)
        im.save(image_path)

# Save training images
save_images(x_train, y_train, 'train')

# Save testing images
save_images(x_test, y_test, 'test')

print(f'Images successfully saved under {base_dir}')


Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/mnist.npz
[1m11490434/11490434[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m2s[0m 0us/step
Images successfully saved under data


## Prepare the data

In [2]:
# Model / data parameters
num_classes = 10
input_shape = (28, 28, 1)

# Load the data and split it between train and test sets
(x_train, y_train), (x_test, y_test) = keras.datasets.mnist.load_data()

# Scale images to the [0, 1] range
x_train = x_train.astype("float32") / 255
x_test = x_test.astype("float32") / 255
# Make sure images have shape (28, 28, 1)
x_train = np.expand_dims(x_train, -1)
x_test = np.expand_dims(x_test, -1)
print("x_train shape:", x_train.shape)
print(x_train.shape[0], "train samples")
print(x_test.shape[0], "test samples")


# convert class vectors to binary class matrices
y_train = keras.utils.to_categorical(y_train, num_classes)
y_test = keras.utils.to_categorical(y_test, num_classes)

NameError: name 'keras' is not defined

## Build the model

In [None]:
model = keras.Sequential(
    [
        keras.Input(shape=input_shape),
        layers.Conv2D(32, kernel_size=(3, 3), activation="relu"),
        layers.MaxPooling2D(pool_size=(2, 2)),
        layers.Conv2D(64, kernel_size=(3, 3), activation="relu"),
        layers.MaxPooling2D(pool_size=(2, 2)),
        layers.Flatten(),
        layers.Dropout(0.5),
        layers.Dense(num_classes, activation="softmax"),
    ]
)

model.summary()

## Train the model

In [3]:
batch_size = 128
epochs = 15

model.compile(loss="categorical_crossentropy", optimizer="adam", metrics=["accuracy"])

model.fit(x_train, y_train, batch_size=batch_size, epochs=epochs, validation_split=0.1)

NameError: name 'model' is not defined

## Evaluate the trained model

In [None]:
score = model.evaluate(x_test, y_test, verbose=0)
print("Test loss:", score[0])
print("Test accuracy:", score[1])

Test loss: 0.028691280633211136
Test accuracy: 0.9908000230789185


Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/mnist.npz
[1m11490434/11490434[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m1s[0m 0us/step
Images successfully saved under data


In [None]:
model.summary()

In [None]:
image_path = "data/train/4/1004.png"
data = keras.utils.load_img(image_path)

In [None]:
data = keras.utils.img_to_array(data)[:, :, 0]

In [None]:
data = np.expand_dims(data, axis=0)
data = np.expand_dims(data, axis=-1)

In [None]:
data.shape

(1, 28, 28, 1)

In [None]:
model.predict(data)

[1m1/1[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 32ms/step


array([[0., 0., 0., 0., 1., 0., 0., 0., 0., 0.]], dtype=float32)

In [None]:
import time

In [None]:
start = time.time()
model.predict(data)
end = time.time()

[1m1/1[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 52ms/step


In [None]:
print("time : ", end - start)

time :  0.16785216331481934
