In [None]:
import tensorflow
import numpy
import matplotlib.pyplot as plt
from sklearn.model_selection import train_test_split
import pandas as pd

In [None]:
# Handle to the Keras MNIST dataset module; the arrays themselves are
# obtained later by calling load_data() on it.
dataSet = tensorflow.keras.datasets.mnist

In [None]:
# load_data() yields a (train, test) pair, each an (images, labels) tuple.
(X_train, y_train), (X_test, y_test) = dataSet.load_data()

# We have 60000 training samples

In [None]:
# Inspect the dimensions of the training array as loaded.
X_train.shape

# We hold out 30% of the training samples for validation

In [None]:
# Carve a validation subset out of the training data.
# NOTE: X_train / y_train are rebound to the reduced training portion, so
# re-running this cell without reloading the data shrinks them again.
X_train, X_val, y_train, y_val = train_test_split(
    X_train,
    y_train,
    test_size=0.3,      # fraction held out for validation
    random_state=101,   # fixed seed so the split is repeatable
)

In [None]:
# Dimensions of the training array that remains after the validation split.
X_train.shape

In [None]:
# Dimensions of the held-out validation array.
X_val.shape

In [None]:
from tensorflow import keras
from tensorflow.keras import layers
from tensorflow.keras import callbacks

In [None]:
# Callback that halts training once the monitored quantity stops improving.
early_stopping = callbacks.EarlyStopping(
    min_delta=0.01,             # smaller changes do not count as an improvement
    patience=10,                # epochs to wait without improvement before stopping
    restore_best_weights=True,  # roll the model back to its best epoch's weights
)

In [None]:
# Fully connected classifier: flatten the 28x28 input, two hidden ReLU layers
# (batch normalisation and dropout follow the first), then a 10-way softmax
# output layer.
model = keras.Sequential()
model.add(layers.Flatten(input_shape=[28, 28]))
model.add(layers.Dense(units=256, activation='relu'))
model.add(layers.BatchNormalization())
model.add(layers.Dropout(0.3))
model.add(layers.Dense(units=128, activation='relu'))
model.add(layers.Dense(units=10, activation='softmax'))

In [None]:
# The model's final layer already applies softmax, so the loss receives
# probabilities rather than raw logits. from_logits must therefore be False;
# with True the loss would treat already-normalised probabilities as logits.
# Labels are integer class ids, hence the sparse variant of the loss.
model.compile(
    optimizer='adam',
    loss=tensorflow.keras.losses.SparseCategoricalCrossentropy(from_logits=False),
)

In [None]:
# Train in mini-batches, evaluating on the validation split after each epoch;
# the early-stopping callback may end the run before the epoch limit.
history = model.fit(
    x=X_train,
    y=y_train,
    validation_data=(X_val, y_val),
    batch_size=256,
    epochs=30,
    callbacks=[early_stopping],
)

In [None]:
# Tabulate the per-epoch values recorded by fit() (one column per tracked
# quantity) and draw them as curves.
history_df = pd.DataFrame.from_dict(history.history)
history_df.plot()

# We used an early-stopping callback to avoid overfitting the model. The Dropout layer serves the same purpose.

In [None]:
# Run the trained model on the test images; each output row comes from the
# softmax layer, i.e. one score per class.
results_prob = model.predict(x=X_test)

In [None]:
# Predicted label = index of the largest score in each row.
results = results_prob.argmax(axis=1)

In [None]:
# Check how many predicted labels were produced.
results.shape

In [None]:
# Boolean mask: True wherever the predicted label equals the true test label.
accurate_results = numpy.equal(results, y_test)

# Accuracy computed to be 0.9807

In [None]:
# Accuracy: the mean of a boolean mask is the fraction of True entries.
accurate_results.mean()

In [None]:
# Show 16 test images, each followed by a bar chart of its class scores.
# The same counter picks both the grid slot and the sample, so the samples
# displayed are the odd-indexed ones: 1, 3, ..., 31.
plt.figure(figsize=(20, 10))
for slot in range(1, 32, 2):
    # Left panel of the pair: the image, with tick marks removed.
    image_ax = plt.subplot(4, 8, slot)
    image_ax.set_xticks([])
    image_ax.set_yticks([])
    image_ax.imshow(X_test[slot])
    image_ax.set_title(f"Predicted Value : {results[slot]}")

    # Right panel of the pair: one bar per class, 0-9.
    score_ax = plt.subplot(4, 8, slot + 1)
    score_ax.bar(range(10), results_prob[slot])
    score_ax.set_xticks(range(10))
plt.tight_layout()

In [None]:
from sklearn.metrics import confusion_matrix,classification_report

In [None]:
# Print the classification report, a blank line, then the confusion matrix
# (true test labels against predicted labels).
print(
    classification_report(y_test, results),
    confusion_matrix(y_test, results),
    sep="\n\n",
)

In [None]:
# Print the model's layer-by-layer summary.
model.summary()