<a href="https://colab.research.google.com/github/emagawa/Transfer-Learning-with-TensorFlow-2.0/blob/main/1_4_Fashion_MNIST_Classifier.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

## Installs & Imports

In [1]:
# Activate TensorFlow 2.x version in Colab.
# NOTE: the recorded output of this cell reports that Colab only includes
# TensorFlow 2.x and that this magic has no effect.
%tensorflow_version 2.x

Colab only includes TensorFlow 2.x; %tensorflow_version has no effect.


In [2]:
# Import TensorFlow and tf.keras
import tensorflow as tf

# Import Numpy & helper libraries
import numpy as np
import matplotlib.pyplot as plt

## Data

### 1. Load the Fashion-MNIST data

In [14]:
# Fetch Fashion-MNIST through tf.keras.datasets and unpack the two
# (images, labels) pairs it returns: the train split first, then the test split.
(train_images, train_labels), (test_images, test_labels) = (
    tf.keras.datasets.fashion_mnist.load_data()
)


### 2. Explore the Fashion-MNIST dataset

In [4]:
# Report the array shapes of both splits. The recorded output shows 60000
# training and 10000 test images of 28x28 pixels, with one label per image.
print(
    "train_images shape:", train_images.shape,
    "train_labels shape:", train_labels.shape,
)
print(
    "test_images shape:", test_images.shape,
    "test_labels shape:", test_labels.shape,
)

train_images shape: (60000, 28, 28) train_labels shape: (60000,)
test_images shape: (10000, 28, 28) test_labels shape: (10000,)


### 3. Data preprocessing

In [5]:
# Convert the pixel data to float32 and scale it from [0, 255] down to [0, 1].
# The integer-dtype guard keeps this cell idempotent: the freshly loaded arrays
# hold integer pixels, so once a split has been converted to float32 a re-run
# leaves it untouched instead of dividing by 255 a second time.
if np.issubdtype(train_images.dtype, np.integer):
    train_images = train_images.astype('float32') / 255
if np.issubdtype(test_images.dtype, np.integer):
    test_images = test_images.astype('float32') / 255

In [6]:
# Add a trailing channel axis: each (28, 28) image becomes (28, 28, 1),
# while the number of examples along the first axis is kept as-is.
train_images = np.reshape(train_images, (len(train_images), 28, 28, 1))
test_images = np.reshape(test_images, (len(test_images), 28, 28, 1))

In [7]:
# Take a look at the dataset shapes after the reshape: the images should now
# carry a trailing channel axis, while the label arrays are unchanged.
print(
    "train_images shape:", train_images.shape,
    "train_labels shape:", train_labels.shape,
)
print(
    "test_images shape:", test_images.shape,
    "test_labels shape:", test_labels.shape,
)

train_images shape: (60000, 28, 28, 1) train_labels shape: (60000,)
test_images shape: (10000, 28, 28, 1) test_labels shape: (10000,)


In [8]:
# One-hot encode the integer class labels into 10 columns (one per class).
# Only 1-D label vectors are encoded, which keeps this cell idempotent:
# re-running it will not feed already one-hot labels back into
# to_categorical and produce a rank-3 array that no longer matches the
# model's output.
if train_labels.ndim == 1:
    train_labels = tf.keras.utils.to_categorical(train_labels, 10)
if test_labels.ndim == 1:
    test_labels = tf.keras.utils.to_categorical(test_labels, 10)

## Model architecture

In [9]:
# Define a CNN with keras sequential model
def create_model(input_shape=(28, 28, 1), num_classes=10, dropout_rate=0.3):
  """Build and compile a small convolutional image classifier.

  The network consists of two Conv2D -> MaxPooling2D -> Dropout stages
  (32 then 64 filters, 3x3 kernels, 'same' padding, ReLU activation),
  followed by Flatten and a softmax Dense layer with one unit per class.

  Args:
    input_shape: Shape of a single input image, excluding the batch axis.
      Defaults to (28, 28, 1).
    num_classes: Number of units in the softmax output layer. Defaults to 10.
    dropout_rate: Rate passed to both Dropout layers. Defaults to 0.3.

  Returns:
    A tf.keras Sequential model compiled with categorical cross-entropy loss
    (so labels must be one-hot encoded), an Adam optimizer with default
    settings, and the 'accuracy' metric.
  """
  # Define the model architecture
  model = tf.keras.models.Sequential([
    # Declare the input shape explicitly instead of passing `input_shape`
    # to the first layer.
    tf.keras.Input(shape=input_shape),

    tf.keras.layers.Conv2D(filters=32, kernel_size=3, padding='same', activation='relu'),
    tf.keras.layers.MaxPooling2D(pool_size=2),
    tf.keras.layers.Dropout(dropout_rate),

    tf.keras.layers.Conv2D(filters=64, kernel_size=3, padding='same', activation='relu'),
    tf.keras.layers.MaxPooling2D(pool_size=2),
    tf.keras.layers.Dropout(dropout_rate),

    tf.keras.layers.Flatten(),
    tf.keras.layers.Dense(num_classes, activation='softmax')
  ])

  # Compile the model
  model.compile(loss=tf.keras.losses.categorical_crossentropy,
         optimizer=tf.keras.optimizers.Adam(),
         metrics=['accuracy'])

  return model

In [10]:
# Create model: build and compile the CNN by calling create_model()
model = create_model()

In [11]:
# Inspect model architecture: prints each layer with its output shape and
# parameter count
model.summary()

Model: "sequential"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 conv2d (Conv2D)             (None, 28, 28, 32)        320       
                                                                 
 max_pooling2d (MaxPooling2  (None, 14, 14, 32)        0         
 D)                                                              
                                                                 
 dropout (Dropout)           (None, 14, 14, 32)        0         
                                                                 
 conv2d_1 (Conv2D)           (None, 14, 14, 64)        18496     
                                                                 
 max_pooling2d_1 (MaxPoolin  (None, 7, 7, 64)          0         
 g2D)                                                            
                                                                 
 dropout_1 (Dropout)         (None, 7, 7, 64)          0

In [12]:
%%time
model.fit(train_images,
         train_labels,
         batch_size=64,
         epochs=5)

Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5
CPU times: user 25.7 s, sys: 2.86 s, total: 28.5 s
Wall time: 42.3 s


<keras.src.callbacks.History at 0x7f116e6105b0>

In [13]:
# Score the trained model on the test split. The displayed result is
# [loss, accuracy], matching the loss and metric given to model.compile().
model.evaluate(test_images,  test_labels, verbose=2)

313/313 - 1s - loss: 0.2744 - accuracy: 0.9030 - 1s/epoch - 3ms/step


[0.27439457178115845, 0.902999997138977]