<a href="https://colab.research.google.com/github/thomsonnapitupulu/ai-ml-exercises/blob/main/Fashion_MNIST_Image_Classifier.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

# Installs and Imports

In [1]:
# Legacy Colab line magic that was used to select the TensorFlow 2.x runtime.
# NOTE(review): the recorded cell output states that it no longer has any
# effect on Colab; it is presumably unavailable outside Colab — confirm before
# running this notebook in a plain Jupyter environment.
%tensorflow_version 2.x

Colab only includes TensorFlow 2.x; %tensorflow_version has no effect.


In [5]:
#Import TensorFlow and tf.Keras
import tensorflow as tf

#Import numpy and helper libraries
import numpy as np
import matplotlib.pyplot as plt


# Data

# 1. Load the Fashion-MNIST Data

In [6]:
# Fetch Fashion-MNIST through tf.keras.datasets and unpack it into
# (images, labels) pairs for the training split and the test split.
(train_images, train_labels), (test_images, test_labels) = tf.keras.datasets.fashion_mnist.load_data()

Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/train-labels-idx1-ubyte.gz
Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/train-images-idx3-ubyte.gz
Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/t10k-labels-idx1-ubyte.gz
Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/t10k-images-idx3-ubyte.gz


# 2. Explore the Fashion-MNIST dataset

In [8]:
# Report the shape of every array in both splits before any preprocessing
for label, array in (
    ("train_images_shape: ", train_images),
    ("train_labels_shape: ", train_labels),
    ("test_images_shape: ", test_images),
    ("test_labels_shape: ", test_labels),
):
  print(label, array.shape)

train_images_shape:  (60000, 28, 28)
train_labels_shape:  (60000,)
test_images_shape:  (10000, 28, 28)
test_labels_shape:  (10000,)


# Data preprocessing

In [9]:
# Convert the image arrays to float32 and scale pixel values by 1/255.
def scale_pixels(images):
  """Return `images` as float32, divided by 255 only if still integer-typed.

  The dtype guard keeps this cell idempotent: after the first run the arrays
  are already float32, so re-running the cell must not divide by 255 again.
  Assumes integer-typed input holds raw pixel intensities in 0-255, as loaded
  by the dataset cell (TODO confirm if the data source changes).

  Args:
    images: NumPy array of image pixels.

  Returns:
    A float32 NumPy array with the same shape as `images`.
  """
  if np.issubdtype(images.dtype, np.integer):
    return images.astype(np.float32) / 255
  # Already floating point: treat as normalised, only enforce the dtype.
  return images.astype(np.float32, copy=False)

train_images = scale_pixels(train_images)
test_images = scale_pixels(test_images)

In [11]:
# Append a trailing channel axis so each image is (28, 28, 1) instead of (28, 28)
train_images = np.reshape(train_images, (len(train_images), 28, 28, 1))
test_images = np.reshape(test_images, (len(test_images), 28, 28, 1))

In [12]:
# Check the dataset shapes again now that the images have been reshaped
for label, array in (
    ("train_images_shape: ", train_images),
    ("train_labels_shape: ", train_labels),
    ("test_images_shape: ", test_images),
    ("test_labels_shape: ", test_labels),
):
  print(label, array.shape)

train_images_shape:  (60000, 28, 28, 1)
train_labels_shape:  (60000,)
test_images_shape:  (10000, 28, 28, 1)
test_labels_shape:  (10000,)


In [13]:
# One-hot encode the class labels into 10 columns.
# Only 1-D label vectors are encoded: re-running this cell on labels that are
# already one-hot would otherwise silently produce an (N, 10, 10) array.
if train_labels.ndim == 1:
  train_labels = tf.keras.utils.to_categorical(train_labels, 10)
if test_labels.ndim == 1:
  test_labels = tf.keras.utils.to_categorical(test_labels, 10)

# Model Architecture

In [18]:
# Define a CNN with keras sequential model
def create_model(input_shape=(28, 28, 1), num_classes=10):
  """Build and compile a small convolutional image classifier.

  The network stacks two blocks of Conv2D (3x3 kernel, 'same' padding, ReLU)
  -> MaxPooling2D(2) -> Dropout(0.3), using 32 and then 64 filters, followed
  by Flatten and a softmax Dense output layer.

  Args:
    input_shape: Shape of a single input image as (height, width, channels).
      Defaults to (28, 28, 1), the shape the images are reshaped to in this
      notebook.
    num_classes: Number of units in the softmax output layer. Defaults to 10.

  Returns:
    A compiled tf.keras Sequential model that uses categorical cross-entropy
    loss (so labels must be one-hot encoded), the Adam optimizer with its
    default settings, and the 'accuracy' metric.
  """
  # Define the model architecture
  model = tf.keras.models.Sequential([
      # Declare the input shape explicitly instead of passing `input_shape=`
      # to the first layer
      tf.keras.Input(shape=input_shape),

      tf.keras.layers.Conv2D(filters=32, kernel_size=3, padding='same', activation='relu'),
      tf.keras.layers.MaxPooling2D(pool_size=2),
      tf.keras.layers.Dropout(0.3),

      tf.keras.layers.Conv2D(filters=64, kernel_size=3, padding='same', activation='relu'),
      tf.keras.layers.MaxPooling2D(pool_size=2),
      tf.keras.layers.Dropout(0.3),

      tf.keras.layers.Flatten(),
      # One output unit per class; softmax turns them into class probabilities
      tf.keras.layers.Dense(num_classes, activation='softmax')
  ])

  # Compile the model
  model.compile(loss=tf.keras.losses.categorical_crossentropy,
                optimizer=tf.keras.optimizers.Adam(),
                metrics=['accuracy'])

  return model

In [19]:
# Build a new, compiled (and still untrained) CNN via create_model()
model = create_model()

In [20]:
# Inspect the model architecture: prints each layer's type, output shape
# and parameter count
model.summary()

Model: "sequential_1"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 conv2d_2 (Conv2D)           (None, 28, 28, 32)        320       
                                                                 
 max_pooling2d_2 (MaxPoolin  (None, 14, 14, 32)        0         
 g2D)                                                            
                                                                 
 dropout_2 (Dropout)         (None, 14, 14, 32)        0         
                                                                 
 conv2d_3 (Conv2D)           (None, 14, 14, 64)        18496     
                                                                 
 max_pooling2d_3 (MaxPoolin  (None, 7, 7, 64)          0         
 g2D)                                                            
                                                                 
 dropout_3 (Dropout)         (None, 7, 7, 64)         

In [21]:
%%time
# Train the model
history = model.fit(train_images, train_labels, batch_size=64, epochs= 5)

Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5
CPU times: user 9min 48s, sys: 14.5 s, total: 10min 2s
Wall time: 7min 23s


In [22]:
# Score the trained model on the test split. The displayed result is
# [loss, accuracy], i.e. the loss followed by the metric passed to compile().
model.evaluate(test_images, test_labels, verbose=2)

313/313 - 3s - loss: 0.2833 - accuracy: 0.9009 - 3s/epoch - 11ms/step


[0.2832612693309784, 0.9009000062942505]