In [None]:
import tensorflow as tf
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Conv2D, MaxPooling2D, Flatten, Dense, Dropout, BatchNormalization
from tensorflow.keras.utils import to_categorical
from tensorflow.keras.datasets import mnist
from tensorflow.keras.preprocessing.image import ImageDataGenerator
import numpy as np

# 📌 Hyperparameters (named so they are easy to find and tune)
num_classes = 10
INPUT_SHAPE = (28, 28, 1)  # height, width, channels passed to the first layer
BATCH_SIZE = 32
EPOCHS = 10

# 📌 Load MNIST dataset
(X_train, y_train), (X_test, y_test) = mnist.load_data()

# 📌 Normalize and reshape
# Cast to float32 before scaling: dividing the integer pixel arrays by 255.0
# directly would produce float64 and double the memory footprint for no gain.
X_train = (X_train.astype("float32") / 255.0).reshape(-1, *INPUT_SHAPE)
X_test = (X_test.astype("float32") / 255.0).reshape(-1, *INPUT_SHAPE)

# 📌 Convert integer labels to one-hot vectors (required by categorical_crossentropy)
y_train = to_categorical(y_train, num_classes)
y_test = to_categorical(y_test, num_classes)

# 📌 Data Augmentation
# Random transforms are applied on the fly to each batch drawn from
# `datagen.flow(...)`; only the training data is passed through it below.
# NOTE: `datagen.fit(...)` is intentionally not called. It is only required
# when featurewise_center, featurewise_std_normalization or zca_whitening is
# enabled, and none of them is set here.
datagen = ImageDataGenerator(
    rotation_range=10,
    width_shift_range=0.1,
    height_shift_range=0.1,
    shear_range=0.1,
    zoom_range=0.1,
)

# 📌 Define Improved CNN Model
# Three Conv -> BatchNorm -> MaxPool stages followed by a dense classifier head.
# The input shape is declared with an explicit Input object rather than the
# `input_shape=` layer argument, which newer Keras versions warn about.
model = Sequential([
    tf.keras.Input(shape=INPUT_SHAPE),

    Conv2D(32, (3, 3), activation='relu'),
    BatchNormalization(),
    MaxPooling2D(pool_size=2, strides=2),

    Conv2D(64, (3, 3), activation='relu'),
    BatchNormalization(),
    MaxPooling2D(pool_size=2, strides=2),

    Conv2D(128, (3, 3), activation='relu'),
    BatchNormalization(),
    MaxPooling2D(pool_size=2, strides=2),

    Flatten(),
    Dense(256, activation='relu'),
    Dropout(0.3),  # Reduce overfitting
    Dense(num_classes, activation='softmax'),  # Output layer: one probability per class
])

# 📌 Compile Model
model.compile(optimizer='adam', loss='categorical_crossentropy', metrics=['accuracy'])

# 📌 Train Model using Augmented Data
# NOTE(review): the test set doubles as the validation set here, so the
# reported val_* metrics are not an unbiased estimate if they are used to
# pick hyperparameters or a stopping epoch. Consider a hold-out split of
# the training data for that purpose.
model.fit(
    datagen.flow(X_train, y_train, batch_size=BATCH_SIZE),
    epochs=EPOCHS,
    validation_data=(X_test, y_test),
)

# 📌 Save Model
# NOTE(review): ".h5" is the legacy HDF5 format; the file name is kept so
# existing consumers of this artifact keep working.
model.save("digit_model_improved.h5")

# 📌 Test Prediction
sample_idx = np.random.randint(0, len(X_test), size=5)  # Pick 5 random samples
sample_images = X_test[sample_idx]
sample_labels = np.argmax(y_test[sample_idx], axis=1)  # one-hot -> class index

predictions = np.argmax(model.predict(sample_images), axis=1)

print("Actual Labels:    ", sample_labels)
print("Predicted Labels: ", predictions)


Epoch 1/5
1875/1875 ━━━━━━━━━━━━━━━━━━━━ 27s 13ms/step - accuracy: 0.8508 - loss: 0.4664 - val_accuracy: 0.9735 - val_loss: 0.0796
Epoch 2/5
1875/1875 ━━━━━━━━━━━━━━━━━━━━ 26s 14ms/step - accuracy: 0.9549 - loss: 0.1458 - val_accuracy: 0.9826 - val_loss: 0.0516
Epoch 3/5
1875/1875 ━━━━━━━━━━━━━━━━━━━━ 25s 13ms/step - accuracy: 0.9631 - loss: 0.1211 - val_accuracy: 0.9838 - val_loss: 0.0493
Epoch 4/5
1875/1875 ━━━━━━━━━━━━━━━━━━━━ 27s 14ms/step - accuracy: 0.9705 - loss: 0.0989 - val_accuracy: 0.9732 - val_loss: 0.0849
Epoch 5/5
1875/1875 ━━━━━━━━━━━━━━━━━━━━ 26s 14ms/step - accuracy: 0.9710 - loss: 0.0947 - val_accuracy: 0.9822 - val_loss: 0.0580
1/1 ━━━━━━━━━━━━━━━━━━━━ 0s 134ms/step
Actual Labels:     [6 5 2 6 1]
Predicted Labels:  [6 5 2 6 1]
