<a href="https://colab.research.google.com/github/Mirco-Nani/experiments_gradient_accumulation/blob/main/notebooks/fashion_mnist.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

# Training a neural network on fashion MNIST with Keras

This simple example demonstrates how to plug TFDS into a Keras model.


Copyright 2020 The TensorFlow Datasets Authors, Licensed under the Apache License, Version 2.0

<table class="tfo-notebook-buttons" align="left">
  <td>
    <a target="_blank" href="https://www.tensorflow.org/datasets/keras_example"><img src="https://www.tensorflow.org/images/tf_logo_32px.png" />View on TensorFlow.org</a>
  </td>
  <td>
    <a target="_blank" href="https://colab.research.google.com/github/tensorflow/datasets/blob/master/docs/keras_example.ipynb"><img src="https://www.tensorflow.org/images/colab_logo_32px.png" />Run in Google Colab</a>
  </td>
  <td>
    <a target="_blank" href="https://github.com/tensorflow/datasets/blob/master/docs/keras_example.ipynb"><img src="https://www.tensorflow.org/images/GitHub-Mark-32px.png" />View source on GitHub</a>
  </td>
  <td>
    <a href="https://storage.googleapis.com/tensorflow_docs/datasets/docs/keras_example.ipynb"><img src="https://www.tensorflow.org/images/download_logo_32px.png" />Download notebook</a>
  </td>
</table>

In [None]:
import tensorflow as tf
import tensorflow_datasets as tfds
import matplotlib.pyplot as plt
from tqdm import tqdm

In [None]:
def plot_history(history):
  """Plot per-epoch loss and accuracy curves for training and validation.

  Args:
    history: Mapping with the keys 'loss', 'val_loss',
      'sparse_categorical_accuracy' and 'val_sparse_categorical_accuracy',
      each holding a sequence with one value per epoch (for example the
      `history` attribute of the object returned by `model.fit`).
  """
  plt.figure(figsize=(20,10))

  # Left panel: loss curves.
  plt.subplot(221)
  plt.plot(history['loss'])
  plt.plot(history['val_loss'])
  plt.title('model loss')
  plt.ylabel('loss')
  plt.xlabel('epoch')
  plt.legend(['train', 'val'])

  # Right panel: accuracy curves. The y-axis shows accuracy, not loss.
  plt.subplot(222)
  plt.plot(history['sparse_categorical_accuracy'])
  plt.plot(history['val_sparse_categorical_accuracy'])
  plt.title('model sparse_categorical_accuracy')
  plt.ylabel('accuracy')
  plt.xlabel('epoch')
  plt.legend(['train', 'val'])

  plt.show()


def prepare_ds(batch_size=128, cache=True, shuffle=True):
  """Load Fashion-MNIST from TFDS and build the train/test input pipelines.

  Args:
    batch_size: Batch size of the training pipeline. The test pipeline is
      always batched by 128.
    cache: If true, cache both pipelines (train before shuffling/batching,
      test after batching).
    shuffle: If true, shuffle the input files and shuffle the training
      examples with a buffer covering the whole training split.

  Returns:
    A `(ds_train, ds_test)` tuple of batched, prefetched datasets yielding
    `(image, label)` pairs with images cast to float32 and divided by 255.
  """
  autotune = tf.data.experimental.AUTOTUNE

  def normalize_img(image, label):
    """Normalizes images: `uint8` -> `float32`."""
    return tf.cast(image, tf.float32) / 255., label

  splits, ds_info = tfds.load(
      'fashion_mnist',
      split=['train', 'test'],
      shuffle_files=shuffle,
      as_supervised=True,
      with_info=True,
  )
  ds_train, ds_test = splits

  # Training pipeline: normalize -> (cache) -> (shuffle) -> batch -> prefetch.
  ds_train = ds_train.map(normalize_img, num_parallel_calls=autotune)
  if cache:
    ds_train = ds_train.cache()
  if shuffle:
    ds_train = ds_train.shuffle(ds_info.splits['train'].num_examples)
  ds_train = ds_train.batch(batch_size).prefetch(autotune)

  # Test pipeline: normalize -> batch -> (cache) -> prefetch.
  ds_test = ds_test.map(normalize_img, num_parallel_calls=autotune).batch(128)
  if cache:
    ds_test = ds_test.cache()
  ds_test = ds_test.prefetch(autotune)

  return ds_train, ds_test



def build_model():
  """Create the classifier: Flatten(28x28) -> Dense(128, relu) -> Dense(10).

  The last layer has no activation, so the model outputs raw logits.

  Returns:
    An uncompiled `tf.keras.models.Sequential` model.
  """
  layers = tf.keras.layers
  flatten = layers.Flatten(input_shape=(28, 28))
  hidden = layers.Dense(128,activation='relu')
  logits = layers.Dense(10)
  return tf.keras.models.Sequential([flatten, hidden, logits])


def build_and_train(ds_train, ds_test, epochs):
  """Build a fresh model and train it with Keras' built-in `fit` loop.

  Args:
    ds_train: Batched dataset of `(images, labels)` used for training.
    ds_test: Batched dataset of `(images, labels)` used for validation.
    epochs: Number of passes over `ds_train`.

  Returns:
    The `history` dict of the `History` object returned by `model.fit`
    (per-epoch loss / accuracy for training and validation).
  """
  model = build_model()

  model.compile(
      optimizer=tf.keras.optimizers.Adam(0.001),
      loss=tf.keras.losses.SparseCategoricalCrossentropy(from_logits=True),
      metrics=[tf.keras.metrics.SparseCategoricalAccuracy()],
  )

  history = model.fit(
      ds_train,
      epochs=epochs,  # honour the caller's value instead of a fixed 6
      validation_data=ds_test,
  )

  return history.history


def build_and_custom_train(ds_train, ds_test, epochs):
  """Build a fresh model and train it with a hand-written training loop.

  Uses the same optimizer (Adam, lr=0.001), loss (sparse categorical
  cross-entropy on logits) and metric (sparse categorical accuracy) as
  `build_and_train`, and returns a history dict with the same keys so the
  result can be passed to `plot_history`.

  Args:
    ds_train: Batched dataset of `(images, labels)` used for gradient steps.
    ds_test: Batched dataset of `(images, labels)` used for validation.
    epochs: Number of passes over `ds_train`.

  Returns:
    Dict with the keys 'loss', 'val_loss', 'sparse_categorical_accuracy' and
    'val_sparse_categorical_accuracy'; each value is a list holding one
    Python float per epoch.
  """
  model = build_model()

  optimizer = tf.keras.optimizers.Adam(0.001)
  loss_function = tf.keras.losses.SparseCategoricalCrossentropy(from_logits=True)

  history = {'loss':[], 'val_loss':[], 'sparse_categorical_accuracy':[], 'val_sparse_categorical_accuracy':[]}

  for epoch in range(epochs):
    # ---- training pass ----
    # The loss object returns the batch *mean* (a scalar), so the epoch loss
    # is accumulated as a sum weighted by the batch size.
    loss_sum, num_examples = 0.0, 0
    # Keras metrics are stateful; a fresh instance per pass keeps training
    # and validation accuracy (and different epochs) from being mixed.
    accuracy = tf.keras.metrics.SparseCategoricalAccuracy()
    for images, labels in tqdm(ds_train, desc=f"Training epoch {epoch}"):
      with tf.GradientTape() as tape:
        logits = model(images, training=True)
        loss = loss_function(labels, logits)
      gradients = tape.gradient(loss, model.trainable_weights)
      optimizer.apply_gradients(zip(gradients, model.trainable_weights))

      batch_size = int(labels.shape[0])
      loss_sum += float(loss.numpy()) * batch_size
      num_examples += batch_size
      accuracy.update_state(labels, logits)

    history['loss'].append(loss_sum / num_examples)
    history['sparse_categorical_accuracy'].append(float(accuracy.result().numpy()))

    # ---- validation pass (no gradient updates) ----
    loss_sum, num_examples = 0.0, 0
    accuracy = tf.keras.metrics.SparseCategoricalAccuracy()
    for images, labels in tqdm(ds_test, desc=f"Validating epoch {epoch}"):
      logits = model(images, training=False)
      loss = loss_function(labels, logits)

      batch_size = int(labels.shape[0])
      loss_sum += float(loss.numpy()) * batch_size
      num_examples += batch_size
      accuracy.update_state(labels, logits)

    history['val_loss'].append(loss_sum / num_examples)
    history['val_sparse_categorical_accuracy'].append(float(accuracy.result().numpy()))

  return history
    

def task(batch_size=128, cache_ds=True, epochs=6, deterministic=True):
  """Run one experiment with the Keras `fit` loop and plot its history.

  Args:
    batch_size: Training batch size forwarded to `prepare_ds`.
    cache_ds: Whether `prepare_ds` should cache the datasets.
    epochs: Number of epochs forwarded to `build_and_train`.
    deterministic: If true, seed TensorFlow's global RNG with 1234 and
      disable shuffling in `prepare_ds`.
  """
  if deterministic:
    tf.random.set_seed(1234)

  # Shuffling is enabled only for non-deterministic runs.
  shuffle = not deterministic
  ds_train, ds_test = prepare_ds(batch_size, cache_ds, shuffle=shuffle)

  plot_history(build_and_train(ds_train, ds_test, epochs))


def custom_task(batch_size=128, cache_ds=True, epochs=6, deterministic=True):
  """Run one experiment with the hand-written training loop and plot it.

  Args:
    batch_size: Training batch size forwarded to `prepare_ds`.
    cache_ds: Whether `prepare_ds` should cache the datasets.
    epochs: Number of epochs forwarded to `build_and_custom_train`.
    deterministic: If true, seed TensorFlow's global RNG with 1234 and
      disable shuffling in `prepare_ds`.
  """
  if deterministic:
    tf.random.set_seed(1234)

  # Shuffling is enabled only for non-deterministic runs.
  shuffle = not deterministic
  ds_train, ds_test = prepare_ds(batch_size, cache_ds, shuffle=shuffle)

  plot_history(build_and_custom_train(ds_train, ds_test, epochs))


# Run the custom-loop experiment once with its default arguments as soon as
# the definitions in this cell have been executed.
custom_task()


In [None]:
# Baseline: Keras `fit` with the defaults (batch_size=128, cached datasets,
# deterministic seed, no shuffling).
task()

In [None]:
# Same default configuration again -- presumably to check that a
# deterministic run reproduces the previous curves.
task()

In [None]:
# Default configuration, but without caching the train/test datasets.
task(cache_ds=False)

In [None]:
# Default configuration with a training batch size of 8 instead of 128
# (the test pipeline in `prepare_ds` is still batched by 128).
task(batch_size=8)

In [None]:
# Default configuration, trained with the hand-written loop instead of `fit`.
custom_task()

# tests

In [None]:
# Manual version of the `fit`-based experiment, run at top level so that
# `ds_train`, `ds_test`, `model` and `history` stay available to later cells.
ds_train, ds_test = prepare_ds()
model = build_model()

# The model outputs logits, hence `from_logits=True` in the loss.
model.compile(
    optimizer=tf.keras.optimizers.Adam(0.001),
    loss=tf.keras.losses.SparseCategoricalCrossentropy(from_logits=True),
    metrics=[tf.keras.metrics.SparseCategoricalAccuracy()],
)

history = model.fit(
    ds_train,
    epochs=6,
    validation_data=ds_test,
)

# `history.history` is the per-epoch metrics dict expected by `plot_history`.
plot_history(history.history)

In [None]:
# Print the layer-by-layer summary of the model built in the cell above.
model.summary()

In [None]:
# Inspect the model's input tensors.
model.inputs

In [None]:
 ds_train  # display the training dataset object

In [None]:
# Pull a single batch from the training pipeline to experiment with by hand.
train = iter(ds_train)
loss=tf.keras.losses.SparseCategoricalCrossentropy(from_logits=True)
for step, (images, labels) in enumerate(train):
  print((images.shape, labels.shape))
  break  # only the first batch is needed
# Forward pass on that batch; the model's last layer has no activation, so
# the outputs are logits.
logits=model(images)

In [None]:
# Shape of the label batch sampled in the previous cell.
labels.shape

In [None]:
# Loss of the sampled batch under the model's current weights.
loss(labels, logits)

In [None]:
# Display the sampled label batch (the variable is `labels`; `label` is
# never defined and raised a NameError).
labels

In [None]:
# Standalone accuracy metric instance for experimenting outside `model.fit`.
metric=tf.keras.metrics.SparseCategoricalAccuracy()

In [None]:
# Calling the metric updates its internal state with this batch and returns
# the accuracy accumulated so far (re-running the cell accumulates again).
metric(labels, logits)

In [None]:
import numpy as np

# Scratch check: product of the elements of a small array (2 * 3).
np.prod(np.array([2, 3]))