In [1]:
import tensorflow as tf
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Conv2D, MaxPooling2D, Flatten, Dense, Dropout, BatchNormalization
from tensorflow.keras.preprocessing.image import ImageDataGenerator
from tensorflow.keras.datasets import mnist
import numpy as np

In [2]:
# Load and preprocess MNIST dataset
(X_train, y_train), (X_test, y_test) = mnist.load_data()

In [3]:
# Normalize pixel values to range [0, 1]
X_train, X_test = X_train / 255.0, X_test / 255.0

In [4]:
# Reshape to fit CNN input format
X_train = X_train.reshape(-1, 28, 28, 1)
X_test = X_test.reshape(-1, 28, 28, 1)

In [5]:
# Data augmentation to improve generalization
datagen = ImageDataGenerator(
    rotation_range=10,
    zoom_range=0.1,
    width_shift_range=0.1,
    height_shift_range=0.1,
    shear_range=0.1
)

In [6]:

# Build CNN model
model = Sequential([
    Conv2D(32, (3,3), activation='relu', input_shape=(28,28,1)),
    BatchNormalization(),
    MaxPooling2D((2,2)),
    
    Conv2D(64, (3,3), activation='relu'),
    BatchNormalization(),
    MaxPooling2D((2,2)),

    Flatten(),
    Dense(128, activation='relu'),
    Dropout(0.2),  # Reduce overfitting
    Dense(10, activation='softmax')  # 10 output classes (digits 0-9)
])

  super().__init__(activity_regularizer=activity_regularizer, **kwargs)


In [7]:
# Compile model
model.compile(optimizer='adam', loss='sparse_categorical_crossentropy', metrics=['accuracy'])


In [None]:
# Train model with augmentation
model.fit(datagen.flow(X_train, y_train, batch_size=32), epochs=50, validation_data=(X_test, y_test))


Epoch 1/50


  self._warn_if_super_not_called()


[1m1875/1875[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m84s[0m 43ms/step - accuracy: 0.8601 - loss: 0.4531 - val_accuracy: 0.9845 - val_loss: 0.0524
Epoch 2/50
[1m1875/1875[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m101s[0m 53ms/step - accuracy: 0.9661 - loss: 0.1181 - val_accuracy: 0.9833 - val_loss: 0.0565
Epoch 3/50
[1m1875/1875[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m139s[0m 74ms/step - accuracy: 0.9738 - loss: 0.0895 - val_accuracy: 0.9843 - val_loss: 0.0471
Epoch 4/50
[1m1875/1875[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m126s[0m 67ms/step - accuracy: 0.9765 - loss: 0.0790 - val_accuracy: 0.9880 - val_loss: 0.0380
Epoch 5/50
[1m1875/1875[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m135s[0m 72ms/step - accuracy: 0.9807 - loss: 0.0669 - val_accuracy: 0.9894 - val_loss: 0.0370
Epoch 6/50
[1m1875/1875[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m141s[0m 75ms/step - accuracy: 0.9808 - loss: 0.0658 - val_accuracy: 0.9887 - val_loss: 0.0361
Epoch 7/50

In [9]:
# Save trained model
model.save("digit_recognition_model.h5")

print("Model training complete. Model saved as 'digit_recognition_model.h5'.")
  



✅ Model training complete. Model saved as 'digit_recognition_model.h5'.
