# Food Vision Project : A story of classifying food images

<p style="text-align:center;"><img src="https://i.pinimg.com/564x/70/b1/55/70b155d20647d2863805da7559cf169d.jpg" alt="Food Vision project banner image" width="500" height="500" class="center"></p>

> <div class="alert alert-block alert-danger">
<b>Danger:</b> This notebook can make you hungry, since it includes very delicious foods!
</div>

Let's create some helper functions that we will reuse at many points during the project.
Here are the functions that we will build now:
* **load_and_prep_image** : A function to import an image and resize it to be able to be used with our model

* **make_confusion_matrix** : A function to plot a labelled confusion matrix, different from Scikit-Learn's own plotting function

* **pred_and_plot** : A function to predict on images and plot them (works with multi-class)

* **create_tensorboard_callback** : Creates a TensorBoard callback instance to store log files.

* **plot_loss_curves** : Plots separate loss and accuracy curves for training and validation metrics.

* **compare_historys** : Compares two TensorFlow model History objects.

* **unzip_data** : Unzips filename into the current working directory.

* **walk_through_dir** : Walks through dir_path and prints how many directories and files each directory contains.

* **calculate_results** : Calculates model accuracy, precision, recall and f1 score of a classification model (precision, recall and f1 use a weighted average over the classes).

In [None]:
import tensorflow as tf

# Create a function to import an image and resize it to be able to be used with our model
def load_and_prep_image(filename, img_shape=224, scale=True):
  """
  Reads in an image from filename, turns it into a tensor and resizes it to
  (img_shape, img_shape, 3).

  Parameters
  ----------
  filename (str): string filename of target image
  img_shape (int): height and width to resize target image to, default 224
  scale (bool): whether to scale pixel values to the range [0, 1], default True

  Returns
  -------
  The resized image tensor, divided by 255 when scale is True.
  """
  # Read in the raw (still encoded) file contents
  img = tf.io.read_file(filename)
  # Decode into a tensor; channels=3 forces RGB so that grayscale files also
  # produce the 3-channel output promised above (the default keeps whatever
  # channel count is stored in the file)
  img = tf.image.decode_jpeg(img, channels=3)
  # Resize the image to a square of side img_shape
  img = tf.image.resize(img, [img_shape, img_shape])
  if scale:
    # Rescale the image (get all values between 0 and 1)
    return img / 255.
  return img

# Note: The following confusion matrix code is a remix of Scikit-Learn's 
# plot_confusion_matrix function - https://scikit-learn.org/stable/modules/generated/sklearn.metrics.plot_confusion_matrix.html
import itertools
import matplotlib.pyplot as plt
import numpy as np
from sklearn.metrics import confusion_matrix

# Our function needs a different name to sklearn's plot_confusion_matrix
def make_confusion_matrix(y_true, y_pred, classes=None, figsize=(10, 10), text_size=15, norm=False, savefig=False):
  """Plots a labelled confusion matrix comparing predictions and ground truth labels.

  If classes is passed, confusion matrix will be labelled, if not, integer class values
  will be used.

  Args:
    y_true: Array of truth labels (must be same shape as y_pred).
    y_pred: Array of predicted labels (must be same shape as y_true).
    classes: Sequence or array of class labels (e.g. string form). If `None`
      or empty, integer labels are used.
    figsize: Size of output figure (default=(10, 10)).
    text_size: Size of output figure text (default=15).
    norm: also show each cell as a percentage of its true-label row (default=False).
    savefig: save confusion matrix to "confusion_matrix.png" in the current
      working directory (default=False).

  Returns:
    None. The confusion matrix is drawn on a new matplotlib figure.

  Example usage:
    make_confusion_matrix(y_true=test_labels, # ground truth test labels
                          y_pred=y_preds, # predicted labels
                          classes=class_names, # array of class label names
                          figsize=(15, 15),
                          text_size=10)
  """
  # Create the confusion matrix
  cm = confusion_matrix(y_true, y_pred)
  n_classes = cm.shape[0] # find the number of classes we're dealing with

  # Row-normalize only when the percentages are actually displayed
  cm_norm = None
  if norm:
    row_totals = cm.sum(axis=1)[:, np.newaxis]
    # A class that never occurs in y_true has an all-zero row; divide by 1
    # there so the cell shows 0.0% instead of nan (and no divide warning)
    row_totals[row_totals == 0] = 1
    cm_norm = cm.astype("float") / row_totals

  # Plot the figure and make it pretty
  fig, ax = plt.subplots(figsize=figsize)
  cax = ax.matshow(cm, cmap=plt.cm.Blues) # darker cells hold higher counts
  fig.colorbar(cax)

  # Use the provided class names when there are any. An explicit None/length
  # check is needed because `if classes:` raises ValueError for NumPy arrays.
  if classes is not None and len(classes) > 0:
    labels = classes
  else:
    labels = np.arange(n_classes)

  # Label the axes
  ax.set(title="Confusion Matrix",
         xlabel="Predicted label",
         ylabel="True label",
         xticks=np.arange(n_classes), # create enough axis slots for each class
         yticks=np.arange(n_classes),
         xticklabels=labels, # axes will be labelled with class names (if they exist) or ints
         yticklabels=labels)

  # Make x-axis labels appear on bottom
  ax.xaxis.set_label_position("bottom")
  ax.xaxis.tick_bottom()

  # Cells above the midpoint of the count range get white text for contrast
  threshold = (cm.max() + cm.min()) / 2.

  # Plot the text on each cell
  for i, j in itertools.product(range(cm.shape[0]), range(cm.shape[1])):
    if norm:
      cell_text = f"{cm[i, j]} ({cm_norm[i, j]*100:.1f}%)"
    else:
      cell_text = f"{cm[i, j]}"
    ax.text(j, i, cell_text,
            horizontalalignment="center",
            color="white" if cm[i, j] > threshold else "black",
            size=text_size)

  # Save the figure to the current working directory
  if savefig:
    fig.savefig("confusion_matrix.png")
  
# Make a function to predict on images and plot them (works with multi-class)
def pred_and_plot(model, filename, class_names):
  """
  Loads the image stored at filename, asks model for a prediction and shows
  the image with the predicted class name as its title.

  Args:
    model: trained model exposing a predict() method
    filename: path of the image to predict on
    class_names: sequence mapping a class index to its name
  """
  # Load and preprocess the image, then add a batch dimension for predict()
  image = load_and_prep_image(filename)
  batch = tf.expand_dims(image, axis=0)
  probs = model.predict(batch)

  # More than one output means multi-class: take the index of the largest value.
  # A single output is rounded to obtain the class index.
  is_multiclass = len(probs[0]) > 1
  if is_multiclass:
    class_index = probs.argmax()
  else:
    class_index = int(tf.round(probs)[0][0])
  predicted_label = class_names[class_index]

  # Show the image without axes, titled with the prediction
  plt.imshow(image)
  plt.title(f"Prediction: {predicted_label}")
  plt.axis(False)
  
import datetime

def create_tensorboard_callback(dir_name, experiment_name):
  """
  Builds a TensorBoard callback instance that stores its log files under

    "dir_name/experiment_name/current_datetime/"

  and prints the chosen log directory.

  Args:
    dir_name: target directory to store TensorBoard log files
    experiment_name: name of experiment directory (e.g. efficientnet_model_1)

  Returns:
    The configured tf.keras.callbacks.TensorBoard instance.
  """
  # Timestamp (YYYYmmdd-HHMMSS) keeps runs of the same experiment apart
  timestamp = datetime.datetime.now().strftime("%Y%m%d-%H%M%S")
  log_dir = "/".join([dir_name, experiment_name, timestamp])
  callback = tf.keras.callbacks.TensorBoard(log_dir=log_dir)
  print(f"Saving TensorBoard log files to: {log_dir}")
  return callback

# Plot the validation and training data separately
import matplotlib.pyplot as plt

def plot_loss_curves(history):
  """
  Plots training/validation loss and training/validation accuracy as two
  separate figures.

  Args:
    history: TensorFlow model History object (see: https://www.tensorflow.org/api_docs/python/tf/keras/callbacks/History)
  """
  metrics = history.history
  # Pull out every curve up front so a missing key fails before anything is drawn
  train_loss, valid_loss, train_acc, valid_acc = (
      metrics[key] for key in ('loss', 'val_loss', 'accuracy', 'val_accuracy')
  )
  epochs = range(len(metrics['loss']))

  # Loss curves are drawn on the current figure
  plt.plot(epochs, train_loss, label='training_loss')
  plt.plot(epochs, valid_loss, label='val_loss')
  plt.title('Loss')
  plt.xlabel('Epochs')
  plt.legend()

  # Accuracy curves get a figure of their own
  plt.figure()
  plt.plot(epochs, train_acc, label='training_accuracy')
  plt.plot(epochs, valid_acc, label='val_accuracy')
  plt.title('Accuracy')
  plt.xlabel('Epochs')
  plt.legend()

def compare_historys(original_history, new_history, initial_epochs=5):
    """
    Plots the metrics of two consecutive training runs as one continuous curve.

    Args:
      original_history: History object from original model (before new_history)
      new_history: History object from continued model training (after original_history)
      initial_epochs: Number of epochs in original_history; a vertical marker
        is drawn at initial_epochs - 1 to show where new_history begins
    """
    before = original_history.history
    after = new_history.history

    # Metrics of the first run
    acc, loss = before["accuracy"], before["loss"]
    val_acc, val_loss = before["val_accuracy"], before["val_loss"]

    # Append the metrics of the second run to those of the first
    total_acc = acc + after["accuracy"]
    total_loss = loss + after["loss"]
    total_val_acc = val_acc + after["val_accuracy"]
    total_val_loss = val_loss + after["val_loss"]

    # x position of the marker separating the two runs
    boundary = [initial_epochs - 1, initial_epochs - 1]

    plt.figure(figsize=(8, 8))

    # Top panel: accuracy
    plt.subplot(2, 1, 1)
    plt.plot(total_acc, label='Training Accuracy')
    plt.plot(total_val_acc, label='Validation Accuracy')
    # ylim() is read after the curves are drawn so the marker spans the panel
    plt.plot(boundary, plt.ylim(), label='Start Fine Tuning')
    plt.legend(loc='lower right')
    plt.title('Training and Validation Accuracy')

    # Bottom panel: loss
    plt.subplot(2, 1, 2)
    plt.plot(total_loss, label='Training Loss')
    plt.plot(total_val_loss, label='Validation Loss')
    plt.plot(boundary, plt.ylim(), label='Start Fine Tuning')
    plt.legend(loc='upper right')
    plt.title('Training and Validation Loss')
    plt.xlabel('epoch')
    plt.show()
  
# Create function to unzip a zipfile into current working directory 
# (since we're going to be downloading and unzipping a few files)
import zipfile

def unzip_data(filename):
  """
  Unzips filename into the current working directory.

  Args:
    filename (str): a filepath to a target zip folder to be unzipped.
  """
  # The context manager closes the archive even when extraction fails
  with zipfile.ZipFile(filename, "r") as zip_ref:
    zip_ref.extractall()

# Walk through an image classification directory and find out how many files (images)
# are in each subdirectory.
import os

def walk_through_dir(dir_path):
  """
  Prints a summary line for dir_path and for every directory below it.

  Args:
    dir_path (str): target directory

  Returns:
    None. For each directory visited, one line is printed with:
      number of subdirectories it contains
      number of files (reported as images) it contains
      its path
  """
  for current_dir, subdirs, files in os.walk(dir_path):
    n_dirs, n_files = len(subdirs), len(files)
    print(f"There are {n_dirs} directories and {n_files} images in '{current_dir}'.")
    
# Function to evaluate: accuracy, precision, recall, f1-score
from sklearn.metrics import accuracy_score, precision_recall_fscore_support

def calculate_results(y_true, y_pred):
  """
  Computes accuracy, precision, recall and f1 score for a set of predictions.

  Args:
      y_true: true labels in the form of a 1D array
      y_pred: predicted labels in the form of a 1D array

  Returns:
      A dictionary with the keys "accuracy" (accuracy_score multiplied by 100),
      "precision", "recall" and "f1" (as returned by
      precision_recall_fscore_support with average="weighted").
  """
  accuracy_percent = accuracy_score(y_true, y_pred) * 100
  # The fourth returned value (support) is not needed
  precision, recall, f1, _ = precision_recall_fscore_support(
      y_true, y_pred, average="weighted"
  )
  return {
      "accuracy": accuracy_percent,
      "precision": precision,
      "recall": recall,
      "f1": f1,
  }

## Loading the Dataset from TFDS

In [None]:
## Use TensorFlow Datasets to download dataset
import tensorflow_datasets as tfds

In [None]:
# List the dataset builders known to TensorFlow Datasets and preview the first ten
datasets_list= tfds.list_builders()
datasets_list[:10]

In [None]:
# Is our target dataset in the list of tfds datasets?
# Prints True when "food101" is one of the entries of datasets_list.
print("food101" in datasets_list)

In [None]:
# Load the "train" and "validation" splits of food101 together with the
# dataset metadata (this may take a while)
(train_data, test_data), ds_info = tfds.load(
    name="food101",
    split=["train", "validation"],
    shuffle_files=True,
    as_supervised=True,  # elements come as (data, label) tuples
    with_info=True,  # also return the metadata object, bound to ds_info
)

## Analyse the Data

#### Features of dataset

In [None]:
# Show the feature description stored in the dataset metadata
ds_info.features

#### Get the class names

In [None]:
# Class names come from the "label" feature of the metadata; preview the first ten
class_names = ds_info.features["label"].names
class_names[:10]

#### Take one sample of train dataset

In [None]:
# Keep only one element of the training dataset for inspection
train_one_sample = train_data.take(1)
train_one_sample

 #### Output info about training sample

In [None]:
 # Print shape, dtype, label tensor and class name for each (image, label) pair
 # of the sample. `image` and `label` stay defined after the loop and are
 # reused by the following cells.
 for image,label in train_one_sample:
   print(f"""
   Image shape: {image.shape}
   Image datatype: {image.dtype}
   Target class (tensor form): {label}
   Class names : {class_names[label.numpy()]}
   """)

#### What does our image tensor look like?

In [None]:
# Display the raw image tensor left over from the sample loop
image

#### What are the min max values of our image?

In [None]:
import tensorflow as tf
# Smallest and largest pixel value found in the sample image
tf.reduce_min(image), tf.reduce_max(image)

#### Plot an image from the dataset :)

In [None]:
import matplotlib.pyplot as plt

# Show the sample image with its class name as title and the axes hidden
plt.figure(figsize=(7,5))
plt.title(class_names[label.numpy()])
plt.imshow(image)
plt.axis(False)

## Preprocessing the Data

#### Create preprocessing functions for our data

In [None]:
def preprocess_image(image, label, image_shape=224):
  """
  Resizes image to [image_shape, image_shape, colour_channels] and casts the
  result to float32. The label is passed through unchanged.

  Returns:
    A tuple (float32 image, label).
  """
  target_size = [image_shape, image_shape]
  resized = tf.image.resize(image, target_size)
  return tf.cast(resized, tf.float32), label

#### Preprocess a single image 

In [None]:
# Run the preprocessing on the sample image (index 0 of the returned tuple is
# the image) and compare shape and dtype before and after
preprocessed_img = preprocess_image(image, label)[0]
print(f"Feature of normal image -> Shape: {image.shape}, DataType: {image.dtype}")
print(f"Feature of preprocessed image -> Shape: {preprocessed_img.shape}, DataType: {preprocessed_img.dtype}")

In [None]:
# --- Training pipeline: preprocess -> shuffle -> batch -> prefetch ---
train_data = train_data.map(map_func=preprocess_image,
                            num_parallel_calls=tf.data.AUTOTUNE)
train_data = train_data.shuffle(buffer_size=1000)
train_data = train_data.batch(batch_size=32)
train_data = train_data.prefetch(buffer_size=tf.data.AUTOTUNE)

# --- Test pipeline: preprocess -> batch -> prefetch (no shuffling) ---
test_data = test_data.map(preprocess_image, num_parallel_calls=tf.data.AUTOTUNE)
test_data = test_data.batch(32)
test_data = test_data.prefetch(tf.data.AUTOTUNE)

In [None]:
# Display both prepared dataset objects
train_data, test_data

### Creating callback function

This callback logs events for TensorBoard, including:

* Metrics summary plots
* Training graph visualization
* Weight histograms
* Sampled profiling

#### Create a model checkpoint callback

In [None]:
checkpoint_path = "model_checkpoints/cp.ckpt"
# The model is compiled with metrics=["accuracy"], so the validation metric is
# logged as "val_accuracy". Monitoring "val_acc" would never find the metric,
# and with save_best_only=True no checkpoint would be written.
model_checkpoint = tf.keras.callbacks.ModelCheckpoint(checkpoint_path,
                                                      monitor="val_accuracy",
                                                      save_best_only=True,  # keep only the best weights seen so far
                                                      save_weights_only=True,  # saving weights is easier than saving the whole model
                                                      verbose=0)

### Mixed Precision

Mixed precision is the use of both 16-bit and 32-bit floating-point types in a model during training to make it run faster and use less memory. By keeping certain parts of the model in 32-bit types for numeric stability, the model will have a lower step time and train equally well in terms of evaluation metrics such as accuracy. This section uses the Keras mixed precision API to speed up our model. Using this API can improve performance by more than 3 times on modern GPUs and 60% on TPUs.

#### Setup mixed precision training

In [None]:
from tensorflow.keras import mixed_precision
# Set the global dtype policy to "mixed_float16"; the model is built later in
# the notebook, after this call
mixed_precision.set_global_policy("mixed_float16")

In [None]:
# Display the dtype policy that is currently set globally
mixed_precision.global_policy()

## Building the Model

In [None]:
# Feature Extraction Model
from tensorflow.keras import layers
# NOTE(review): `preprocessing` is only referenced in the comment further down
from tensorflow.keras.layers.experimental import preprocessing

# Create base model: EfficientNetB0 without its classification top, with all
# of its layers frozen
input_shape = (224,224,3)
base_model = tf.keras.applications.EfficientNetB0(include_top = False)
base_model.trainable= False

# Create functional model
inputs = layers.Input(shape=input_shape, name= "input_layer")
# Note: Since EfficientNetBX models have rescaling no need to use preprocessing e.g. x= preprocessing.Rescaling(1/255.)

# Call the base model with training=False, pool its output, then add one
# output unit per class
x=base_model(inputs, training=False)
x = layers.GlobalAveragePooling2D()(x)
x = layers.Dense(len(class_names))(x)
# The softmax activation is a separate layer with an explicit float32 dtype
outputs = layers.Activation("softmax", dtype=tf.float32, name ="softmax_float32")(x)
model = tf.keras.Model(inputs,outputs)

# Compile the model (sparse loss: labels are integer class indices — presumably, verify against the dataset)
model.compile(loss = "sparse_categorical_crossentropy",
              optimizer = tf.keras.optimizers.Adam(),
              metrics=["accuracy"])

# Get a summary of the model
model.summary()

In [None]:
# Print the dtype of every top-level layer of the model
for layer in model.layers:
  print(layer.dtype)

#### Check the top ten layers of base model

In [None]:
# NOTE(review): `dtype` imported from numpy is not used in this cell
from numpy import dtype

# model.layers[1] is the base model; print name, trainable flag, dtype and
# dtype policy of its first ten layers
for layer in model.layers[1].layers[:10]:
  print(layer.name, layer.trainable, layer.dtype, layer.dtype_policy)

#### Fit feature extraction model with callback

In [None]:
# Train the model for 3 epochs, validating on 15% of the test batches after
# each epoch. validation_steps is documented as an integer, so the fractional
# product is truncated with int().
history_feature_extraction = model.fit(
    train_data,
    epochs=3,
    steps_per_epoch=len(train_data),
    validation_data=test_data,
    validation_steps=int(0.15 * len(test_data)),
    callbacks=[
        create_tensorboard_callback(dir_name="training_logs",
                                    experiment_name="efficientnetb0_101_classes_all_data_feature_extract"),
        model_checkpoint,
    ],
)

In [None]:
# Evaluate on the complete test dataset (training only validated on part of it)
results_feature_extraction_model = model.evaluate(test_data)
results_feature_extraction_model

#### Fine Tuning

In [None]:
# Unfreeze the whole base model first ...
base_model.trainable = True

# ... then freeze every layer again except the last 10
for layer in base_model.layers[:-10]:
  layer.trainable = False

# Recompile the model with an explicit Adam learning rate of 0.0001
model.compile(loss = "sparse_categorical_crossentropy",
              optimizer = tf.keras.optimizers.Adam(learning_rate=0.0001),
              metrics=["accuracy"])

# Number of trainable variables after unfreezing
print(len(model.trainable_variables))

#### Check which layers are trainable

In [None]:
# List index, name and trainable flag of every layer inside the base model
# (model.layers[1])
for layer_number, layer in enumerate(model.layers[1].layers):
  print(layer_number, layer.name, layer.trainable)

### Early Stopping and Learning Rate Reduction Callbacks

**Early Stopping Callback** stops training when a monitored metric has stopped improving.

**Learning Rate Reduction Callback** reduces learning rate when a metric has stopped improving.

In [None]:
# Setup EarlyStopping callback to stop training if model's val_loss doesn't improve for 3 epochs
early_stopping = tf.keras.callbacks.EarlyStopping(monitor="val_loss", # watch the val loss metric
                                                  patience=3)

# Create a learning rate reduction callback: when val_loss has not improved
# for 2 epochs the learning rate is multiplied by 0.2, never going below 1e-7
reduce_lr = tf.keras.callbacks.ReduceLROnPlateau(monitor="val_loss",  
                                                 factor=0.2, # multiply the learning rate by 0.2 (reduce by 5x)
                                                 patience=2,
                                                 verbose=1, # print out when learning rate goes down 
                                                 min_lr=1e-7)

### Fit the Model

#### Fit the fine-tuning model with callbacks

In [None]:
# Fine-tune for up to 100 epochs; the early_stopping callback ends training
# sooner when val_loss stops improving. validation_steps is documented as an
# integer, so the fractional product is truncated with int().
history_fine_tuning = model.fit(
    train_data,
    epochs=100,
    steps_per_epoch=len(train_data),
    validation_data=test_data,
    validation_steps=int(0.15 * len(test_data)),
    callbacks=[
        create_tensorboard_callback(dir_name="training_logs",
                                    experiment_name="efficientnetb0_101_classes_all_data_fine_tuning"),
        model_checkpoint,
        early_stopping,  # stop model after X epochs of no improvements
        reduce_lr,
    ],
)

In [None]:
# Evaluate the fine-tuned model on the complete test dataset
results_fine_tuned_model = model.evaluate(test_data)

#### Make predictions with model

In [None]:
# Predict on the complete test dataset, showing a progress bar
pred_probs = model.predict(test_data, verbose = 1)

#### How many predictions are there?

In [None]:
# Number of prediction rows returned by model.predict
len(pred_probs)

#### For the first prediction, let's look at the probabilities

In [None]:
# Inspect the first prediction: how many values it holds, the values
# themselves, and the index of the largest one
print(f"Number of prediction probs for sample 0: {len(pred_probs[0])}")
print(f"What prediction probability sample looks like for sample 0: {pred_probs[0]}")
print(f"The class with the highest predicted probability for sample 0: {tf.argmax(pred_probs[0])}")

> <div class="alert alert-block alert-success">
<b>Success:</b> Don't Forget to upvote if you like the notebook
</div>