<a href="https://colab.research.google.com/github/YukishigeKawaguchi/MachineLearning/blob/main/Fashion_mnist.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [1]:
# Tensorflow
import tensorflow as tf

# Numpy
import numpy as np
import matplotlib.pyplot as plt

In [2]:
# Fetch the Fashion-MNIST train/test splits (downloaded on first use) and unpack each (images, labels) pair
fashion_mnist = tf.keras.datasets.fashion_mnist
(train_images, train_labels), (test_images, test_labels) = fashion_mnist.load_data()

Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/train-labels-idx1-ubyte.gz
Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/train-images-idx3-ubyte.gz
Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/t10k-labels-idx1-ubyte.gz
Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/t10k-images-idx3-ubyte.gz


In [3]:
# Report the array shapes of both splits straight after loading
print("train_images shape: ", train_images.shape,
      "train_labels shape: ", train_labels.shape)
print("test_images shape: ", test_images.shape,
      "test_labels shape: ", test_labels.shape)

train_images shape:  (60000, 28, 28) train_labels shape:  (60000,)
test_images shape:  (10000, 28, 28) test_labels shape:  (10000,)


In [4]:
# Convert the pixel data to float32 and scale it by 1/255.
# The uint8 guard keeps this cell idempotent: load_data() returns uint8 pixel
# arrays, so on a second run (arrays already float32) the division is skipped
# instead of being applied again and silently shrinking the inputs.
if train_images.dtype == np.uint8:
    train_images = train_images.astype('float32') / 255
if test_images.dtype == np.uint8:
    test_images = test_images.astype('float32') / 255

In [5]:
# Add a trailing channel axis of size 1: (N, 28, 28) -> (N, 28, 28, 1)
train_images = train_images.reshape((len(train_images), 28, 28, 1))
test_images = test_images.reshape((len(test_images), 28, 28, 1))

In [6]:
# Take a look at the dataset shapes after the reshape
print("train_images shape: ", train_images.shape,
      "train_labels shape: ", train_labels.shape)
print("test_images shape: ", test_images.shape,
      "test_labels shape: ", test_labels.shape)

train_images shape:  (60000, 28, 28, 1) train_labels shape:  (60000,)
test_images shape:  (10000, 28, 28, 1) test_labels shape:  (10000,)


In [7]:
# One-hot encode the integer class labels: shape (N,) -> (N, NUM_CLASSES).
# The ndim guard keeps this cell idempotent: running to_categorical on labels
# that are already one-hot would append yet another class axis.
NUM_CLASSES = 10
if train_labels.ndim == 1:
    train_labels = tf.keras.utils.to_categorical(train_labels, NUM_CLASSES)
if test_labels.ndim == 1:
    test_labels = tf.keras.utils.to_categorical(test_labels, NUM_CLASSES)

In [8]:
# Define a CNN with keras sequential model
def create_model(input_shape=(28, 28, 1), num_classes=10, dropout_rate=0.3):
  """Build and compile a small convolutional image classifier.

  Two Conv2D -> MaxPooling2D -> Dropout stages (32 filters, then 64) feed a
  flattened softmax output layer. Called with no arguments it builds exactly
  the network this notebook uses: 28x28x1 inputs, 10 classes, dropout 0.3.

  Args:
    input_shape: Shape of a single input sample, excluding the batch axis.
    num_classes: Number of units in the softmax output layer; must equal the
      width of the one-hot label vectors passed to fit/evaluate.
    dropout_rate: Rate passed to the Dropout layer that follows each pooling
      layer.

  Returns:
    A compiled tf.keras Sequential model using categorical cross-entropy
    loss, an Adam optimizer with default settings, and the accuracy metric.
  """

  # Define the model architecture
  model = tf.keras.models.Sequential([
      # Must define the input shape in the first layers of the neural network
      tf.keras.layers.Conv2D(filters=32, kernel_size=3, padding='same', activation='relu', input_shape=input_shape),
      tf.keras.layers.MaxPooling2D(pool_size=2),
      tf.keras.layers.Dropout(dropout_rate),

      tf.keras.layers.Conv2D(filters=64, kernel_size=3, padding='same', activation='relu'),
      tf.keras.layers.MaxPooling2D(pool_size=2),
      tf.keras.layers.Dropout(dropout_rate),

      # Collapse the feature maps into a vector and emit one probability per class
      tf.keras.layers.Flatten(),
      tf.keras.layers.Dense(num_classes, activation='softmax')
  ])

  # Compile the model; categorical cross-entropy expects one-hot encoded labels
  model.compile(loss=tf.keras.losses.categorical_crossentropy,
                optimizer=tf.keras.optimizers.Adam(),
                metrics=['accuracy'])
  return model

In [9]:
# Build and compile the CNN with create_model()'s default arguments;
# the summary, fit and evaluate cells below all operate on this `model` instance
model = create_model()

In [10]:
# Inspect the model architecture: prints each layer's type, output shape and parameter count
model.summary()

Model: "sequential"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
conv2d (Conv2D)              (None, 28, 28, 32)        320       
_________________________________________________________________
max_pooling2d (MaxPooling2D) (None, 14, 14, 32)        0         
_________________________________________________________________
dropout (Dropout)            (None, 14, 14, 32)        0         
_________________________________________________________________
conv2d_1 (Conv2D)            (None, 14, 14, 64)        18496     
_________________________________________________________________
max_pooling2d_1 (MaxPooling2 (None, 7, 7, 64)          0         
_________________________________________________________________
dropout_1 (Dropout)          (None, 7, 7, 64)          0         
_________________________________________________________________
flatten (Flatten)            (None, 3136)              0

In [11]:
%%time
model.fit(train_images,
          train_labels,
          batch_size=64,
          epochs=5)

Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5
CPU times: user 18.9 s, sys: 2.68 s, total: 21.6 s
Wall time: 1min 22s


<tensorflow.python.keras.callbacks.History at 0x7fcc16110e10>

In [13]:
# Score the trained model on the test split; the displayed result is [loss, accuracy]
model.evaluate(x=test_images, y=test_labels, verbose=2)

313/313 - 1s - loss: 0.2794 - accuracy: 0.9013


[0.27944016456604004, 0.9013000130653381]