<a href="https://colab.research.google.com/github/fatehtariq/Fashion-MNIST-Classifier/blob/main/Fashion_MNIST_Classifier.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

# Fashion MNIST Classifier

**Libraries**

In [78]:
import tensorflow as tf
import numpy as np
import matplotlib.pyplot as plt
from keras.layers.normalization import BatchNormalization
import pandas as pd
from tensorflow.math import confusion_matrix
from sklearn.metrics import plot_confusion_matrix

**Loading Dataset**

In [None]:
(x_train, y_train), (x_test, y_test) = tf.keras.datasets.fashion_mnist.load_data()

Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/train-labels-idx1-ubyte.gz
Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/train-images-idx3-ubyte.gz
Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/t10k-labels-idx1-ubyte.gz
Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/t10k-images-idx3-ubyte.gz


In [None]:
print("x_train shape (Training Images):", x_train.shape, "y_train shape (Training Labels):", y_train.shape)

x_train shape (Training Images): (60000, 28, 28) y_train shape (Training Labels): (60000,)


**Preprocessing Data**

In [None]:
W, H = 28, 28
x_train = x_train.reshape(x_train.shape[0], W, H, 1)
x_test = x_test.reshape(x_test.shape[0], W, H, 1)

x_train.shape

(60000, 28, 28, 1)

**Model**

In [None]:
from tensorflow.keras.layers import Dense, Conv2D, MaxPooling2D, Dropout, Flatten, Activation

Model with Categorical Cross Entropy

In [None]:
model1 = tf.keras.Sequential()

model1.add(Conv2D(filters=8, kernel_size=5, padding='same', activation='relu', input_shape=(28,28,1)))          
model1.add(MaxPooling2D(pool_size=2))
model1.add(Dropout(0.3))

model1.add(Conv2D(filters=32, kernel_size=7, activation='relu', input_shape=(8,8,1)))              
model1.add(MaxPooling2D(pool_size=1))
model1.add(Dropout(0.3))

model1.add(Conv2D(filters=64, kernel_size=5,activation='relu', input_shape=(4,4,1)))             
model1.add(MaxPooling2D(pool_size=1))
model1.add(Dropout(0.3))

model1.add(Conv2D(128, (3, 3),activation='relu', input_shape=(2,2,1)))              
model1.add(MaxPooling2D(pool_size=1))
model1.add(Dropout(0.3))

model1.add(Flatten())

model1.add(Dense(512))                                      
model1.add(Activation('relu'))
model1.add(Dropout(0.3))

model1.add(Dense(128))                                      
model1.add(Activation('relu'))
model1.add(Dropout(0.3))

model1.add(Dense(10))                                     
model1.add(Activation('Softmax'))

model1.summary()

Model: "sequential_22"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
conv2d_85 (Conv2D)           (None, 28, 28, 8)         208       
_________________________________________________________________
max_pooling2d_82 (MaxPooling (None, 14, 14, 8)         0         
_________________________________________________________________
dropout_118 (Dropout)        (None, 14, 14, 8)         0         
_________________________________________________________________
conv2d_86 (Conv2D)           (None, 8, 8, 32)          12576     
_________________________________________________________________
max_pooling2d_83 (MaxPooling (None, 8, 8, 32)          0         
_________________________________________________________________
dropout_119 (Dropout)        (None, 8, 8, 32)          0         
_________________________________________________________________
conv2d_87 (Conv2D)           (None, 4, 4, 64)        

Model with Mean Squared Error

In [59]:
model2 = tf.keras.Sequential()

model2.add(Conv2D(filters=8, kernel_size=5, padding='same', activation='relu', input_shape=(28,28,1)))          
model2.add(MaxPooling2D(pool_size=2))
model2.add(Dropout(0.3))

model2.add(Conv2D(filters=32, kernel_size=7, activation='relu', input_shape=(8,8,1)))              
model2.add(MaxPooling2D(pool_size=1))
model2.add(Dropout(0.3))

model2.add(Conv2D(filters=64, kernel_size=5,activation='relu', input_shape=(4,4,1)))             
model2.add(MaxPooling2D(pool_size=1))
model2.add(Dropout(0.3))

model2.add(Conv2D(128, (3, 3),activation='relu', input_shape=(2,2,1)))              
model2.add(MaxPooling2D(pool_size=1))
model2.add(Dropout(0.3))

model2.add(Flatten())

model2.add(Dense(512))                                      
model2.add(Activation('relu'))
model2.add(Dropout(0.3))

model2.add(Dense(128))                                      
model2.add(Activation('relu'))
model2.add(Dropout(0.3))

model2.add(Dense(10))                                     
model2.add(Activation('Softmax'))

model2.summary()

Model: "sequential_23"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
conv2d_89 (Conv2D)           (None, 28, 28, 8)         208       
_________________________________________________________________
max_pooling2d_86 (MaxPooling (None, 14, 14, 8)         0         
_________________________________________________________________
dropout_124 (Dropout)        (None, 14, 14, 8)         0         
_________________________________________________________________
conv2d_90 (Conv2D)           (None, 8, 8, 32)          12576     
_________________________________________________________________
max_pooling2d_87 (MaxPooling (None, 8, 8, 32)          0         
_________________________________________________________________
dropout_125 (Dropout)        (None, 8, 8, 32)          0         
_________________________________________________________________
conv2d_91 (Conv2D)           (None, 4, 4, 64)        

**Compiling and Training the Model with Categorical Cross Entropy**

In [60]:
BATCH_SIZE=1000
EPOCHS = 50
model1.compile(loss='sparse_categorical_crossentropy',
             optimizer='adam',
             metrics=['accuracy'])

In [61]:
%time history = model1.fit(x_train, y_train, epochs=EPOCHS, batch_size=BATCH_SIZE, validation_split=0.2, verbose=1)

Epoch 1/50
Epoch 2/50
Epoch 3/50
Epoch 4/50
Epoch 5/50
Epoch 6/50
Epoch 7/50
Epoch 8/50
Epoch 9/50
Epoch 10/50
Epoch 11/50
Epoch 12/50
Epoch 13/50
Epoch 14/50
Epoch 15/50
Epoch 16/50
Epoch 17/50
Epoch 18/50
Epoch 19/50
Epoch 20/50
Epoch 21/50
Epoch 22/50
Epoch 23/50
Epoch 24/50
Epoch 25/50
Epoch 26/50
Epoch 27/50
Epoch 28/50
Epoch 29/50
Epoch 30/50
Epoch 31/50
Epoch 32/50
Epoch 33/50
Epoch 34/50
Epoch 35/50
Epoch 36/50
Epoch 37/50
Epoch 38/50
Epoch 39/50
Epoch 40/50
Epoch 41/50
Epoch 42/50
Epoch 43/50
Epoch 44/50
Epoch 45/50
Epoch 46/50
Epoch 47/50
Epoch 48/50
Epoch 49/50
Epoch 50/50
CPU times: user 1min 38s, sys: 2.64 s, total: 1min 40s
Wall time: 2min 22s


In [62]:
train_loss, train_accuracy = model1.evaluate(x_train, y_train, batch_size=BATCH_SIZE)
train_accuracy



0.9373999834060669

In [63]:
test_loss, test_accuracy = model1.evaluate(x_test, y_test, batch_size=BATCH_SIZE)
test_accuracy



0.9100000262260437

**Compiling and Training the Model with Mean Square Error**

In [64]:
BATCH_SIZE=1000
EPOCHS = 50
model2.compile(loss=tf.keras.losses.mean_squared_error,
             optimizer='adam',
             metrics=['accuracy'])

In [65]:
%time history = model2.fit(x_train, y_train, epochs=EPOCHS, batch_size=BATCH_SIZE, validation_split=0.2, verbose=1)

Epoch 1/50
Epoch 2/50
Epoch 3/50
Epoch 4/50
Epoch 5/50
Epoch 6/50
Epoch 7/50
Epoch 8/50
Epoch 9/50
Epoch 10/50
Epoch 11/50
Epoch 12/50
Epoch 13/50
Epoch 14/50
Epoch 15/50
Epoch 16/50
Epoch 17/50
Epoch 18/50
Epoch 19/50
Epoch 20/50
Epoch 21/50
Epoch 22/50
Epoch 23/50
Epoch 24/50
Epoch 25/50
Epoch 26/50
Epoch 27/50
Epoch 28/50
Epoch 29/50
Epoch 30/50
Epoch 31/50
Epoch 32/50
Epoch 33/50
Epoch 34/50
Epoch 35/50
Epoch 36/50
Epoch 37/50
Epoch 38/50
Epoch 39/50
Epoch 40/50
Epoch 41/50
Epoch 42/50
Epoch 43/50
Epoch 44/50
Epoch 45/50
Epoch 46/50
Epoch 47/50
Epoch 48/50
Epoch 49/50
Epoch 50/50
CPU times: user 1min 36s, sys: 2.55 s, total: 1min 39s
Wall time: 1min 40s


In [66]:
train_loss, train_accuracy = model2.evaluate(x_train, y_train, batch_size=BATCH_SIZE)
train_accuracy



0.10000000149011612

In [67]:
test_loss, test_accuracy = model2.evaluate(x_test, y_test, batch_size=BATCH_SIZE)
test_accuracy



0.10000000149011612

In [70]:
predictions1 = model1.predict(x_test)

In [71]:
predictions1

array([[7.56357321e-25, 2.40299943e-26, 7.09197313e-24, ...,
        2.38157936e-05, 6.74241799e-17, 9.99976158e-01],
       [4.61840983e-07, 1.22142612e-20, 9.99795854e-01, ...,
        9.66274318e-31, 7.57599550e-14, 2.51308354e-30],
       [0.00000000e+00, 1.00000000e+00, 0.00000000e+00, ...,
        0.00000000e+00, 0.00000000e+00, 0.00000000e+00],
       ...,
       [9.48029503e-20, 0.00000000e+00, 4.00741108e-30, ...,
        0.00000000e+00, 1.00000000e+00, 0.00000000e+00],
       [2.35550410e-29, 1.00000000e+00, 1.53393435e-33, ...,
        0.00000000e+00, 0.00000000e+00, 0.00000000e+00],
       [4.42030839e-08, 6.36963052e-11, 4.63495997e-09, ...,
        5.72378635e-02, 1.52920809e-04, 7.71280611e-05]], dtype=float32)

In [86]:
yhat_classes = model1.predict_classes(x_test, verbose=0)



**Confusion Matrix for Categorical Cross Entropy**

In [89]:
matrix = confusion_matrix(y_test, yhat_classes)
print(matrix)

tf.Tensor(
[[877   1  15  13   4   1  84   0   5   0]
 [  2 984   0  11   1   0   2   0   0   0]
 [ 17   0 824   7  74   0  77   0   1   0]
 [  9   6   6 925  35   0  19   0   0   0]
 [  1   1  35  26 865   0  72   0   0   0]
 [  0   0   0   0   0 972   0  23   0   5]
 [108   1  45  31  69   0 741   0   5   0]
 [  0   0   0   0   0   5   0 985   0  10]
 [  4   1   1   2   3   2   4   3 980   0]
 [  0   0   0   0   0   6   0  47   0 947]], shape=(10, 10), dtype=int32)


**Confusion Matrix for Mean Squared Error**

In [90]:
yhat_classes2 = model2.predict_classes(x_test, verbose=0)



In [92]:
matrix = confusion_matrix(y_test, yhat_classes2)
print(matrix)

tf.Tensor(
[[   0    0    0    0    0    0 1000    0    0    0]
 [   0    0    0    0    0    0 1000    0    0    0]
 [   0    0    0    0    0    0 1000    0    0    0]
 [   0    0    0    0    0    0 1000    0    0    0]
 [   0    0    0    0    0    0 1000    0    0    0]
 [   0    0    0    0    0    0 1000    0    0    0]
 [   0    0    0    0    0    0 1000    0    0    0]
 [   0    0    0    0    0    0 1000    0    0    0]
 [   0    0    0    0    0    0 1000    0    0    0]
 [   0    0    0    0    0    0 1000    0    0    0]], shape=(10, 10), dtype=int32)
