In [1]:
# Python ≥3.5 is required
import sys
assert sys.version_info >= (3, 5)

# Scikit-Learn ≥0.20 is required
import sklearn
assert sklearn.__version__ >= "0.20"

try:
    # %tensorflow_version only exists in Colab.
    %tensorflow_version 2.x
    !pip install -U tqdm
except Exception:
    pass

# TensorFlow ≥2.0 is required
import tensorflow as tf
from tensorflow import keras
assert tf.__version__ >= "2.0"

# Common imports
import numpy as np
import os

# to make this notebook's output stable across runs
np.random.seed(42)
tf.random.set_seed(42)

# To plot pretty figures
%matplotlib inline
import matplotlib as mpl
import matplotlib.pyplot as plt
mpl.rc('axes', labelsize=14)
mpl.rc('xtick', labelsize=12)
mpl.rc('ytick', labelsize=12)

# Where to save the figures
PROJECT_ROOT_DIR = "."
CHAPTER_ID = "deep"
IMAGES_PATH = os.path.join(PROJECT_ROOT_DIR, "images", CHAPTER_ID)

## 12. Implement a custom layer that performs Layer Normalization

In [5]:
class LayerNormalization(keras.layers.Layer):
    """Custom Keras layer that normalizes its input along the last axis.

    Each input is centred and scaled using the mean and variance computed
    over its last axis, then multiplied by a trainable scale ``alpha`` and
    shifted by a trainable offset ``beta`` (both shaped like the last axis).
    """

    def __init__(self, eps=0.001, **kwargs):
        """Store the smoothing term ``eps``; other kwargs go to the base Layer."""
        super().__init__(**kwargs)
        self.eps = eps

    def build(self, batch_input_shape):
        """Create ``alpha`` (initialised to ones) and ``beta`` (initialised to zeros)."""
        # Slicing with [-1:] keeps the size of the last axis wrapped as a shape.
        feature_shape = batch_input_shape[-1:]
        self.alpha = self.add_weight(name="alpha", shape=feature_shape, initializer="ones")
        self.beta = self.add_weight(name="beta", shape=feature_shape, initializer="zeros")
        super().build(batch_input_shape)

    def call(self, X):
        """Normalize ``X`` over its last axis, then apply ``alpha`` and ``beta``."""
        mean, variance = tf.nn.moments(X, axes=-1, keepdims=True)
        # eps is added to the variance before the square root, which keeps the
        # denominator away from zero.
        stddev = tf.sqrt(variance + self.eps)
        scaled = self.alpha * (X - mean)
        return scaled / stddev + self.beta

    def compute_output_shape(self, batch_input_shape):
        """The output has the same shape as the input."""
        return batch_input_shape

    def get_config(self):
        """Return the base layer config extended with ``eps``."""
        return dict(super().get_config(), eps=self.eps)

In [3]:
from sklearn.datasets import fetch_california_housing
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler

# Load the California housing data and hold out a test set; the targets are
# reshaped into a single column.
housing = fetch_california_housing()
X_train_full, X_test, y_train_full, y_test = train_test_split(
    housing.data, housing.target.reshape(-1, 1), random_state=42)

# Split the remaining data again to obtain a validation set.
X_train, X_valid, y_train, y_valid = train_test_split(
    X_train_full, y_train_full, random_state=42)

# Fit the scaler on the training features only, then apply that same
# transformation to every split.
scaler = StandardScaler().fit(X_train)
X_train_scaled, X_valid_scaled, X_test_scaled = (
    scaler.transform(split) for split in (X_train, X_valid, X_test))

In [6]:
# Use the training features (X_train, not the scaled copy), cast to float32,
# as the input for comparing the two layers.
X = X_train.astype(np.float32)

# One instance of the custom layer defined above and one of Keras' built-in layer.
custom_layer_norm = LayerNormalization()
keras_layer_norm = keras.layers.LayerNormalization()

# Mean absolute difference between the two layers' outputs on the same input;
# a value close to zero means the two implementations agree.
tf.reduce_mean(keras.losses.mean_absolute_error(
    keras_layer_norm(X), custom_layer_norm(X)
))

<tf.Tensor: id=129, shape=(), dtype=float32, numpy=5.4875404e-08>

In [7]:
# Draw one random value per feature (last axis of X) for the scale and the offset.
random_alpha = np.random.rand(X.shape[-1])
random_beta = np.random.rand(X.shape[-1])

# Give both layers the same weights so their outputs stay comparable.
# The custom layer creates alpha before beta, so that is its weight order.
# NOTE(review): assumes the built-in layer also orders its weights as
# [scale, offset] — confirm against the Keras documentation.
custom_layer_norm.set_weights([random_alpha, random_beta])
keras_layer_norm.set_weights([random_alpha, random_beta])

# Repeat the comparison with non-trivial weights: mean absolute difference
# between the two layers' outputs (close to zero means they agree).
tf.reduce_mean(keras.losses.mean_absolute_error(
    keras_layer_norm(X), custom_layer_norm(X)
))

<tf.Tensor: id=172, shape=(), dtype=float32, numpy=2.3667205e-08>

## 13. Train a model using a custom training loop to tackle the Fashion MNIST dataset

In [10]:
# Load Fashion MNIST as (train images, train labels), (test images, test labels).
(X_train_full, y_train_full), (X_test, y_test) = keras.datasets.fashion_mnist.load_data()

# Convert the images to float32 and divide by 255
# (presumably 8-bit pixel intensities, which this maps into [0, 1]).
X_train_full = X_train_full.astype(np.float32) / 255.0
X_test = X_test.astype(np.float32) / 255.0

# The first 5000 training examples become the validation set; the rest is
# used for training.
X_valid, y_valid = X_train_full[:5000], y_train_full[:5000]
X_train, y_train = X_train_full[5000:], y_train_full[5000:]

In [11]:
# Clear the Keras backend session, then re-seed NumPy and TensorFlow so the
# model built and trained below starts from the same random state on each run.
keras.backend.clear_session()
np.random.seed(42)
tf.random.set_seed(42)

In [12]:
# Small fully connected classifier: flatten each 28x28 input, pass it through
# one hidden ReLU layer of 100 units, and output 10 softmax scores.
model = keras.models.Sequential()
model.add(keras.layers.Flatten(input_shape=[28, 28]))
model.add(keras.layers.Dense(100, activation="relu"))
model.add(keras.layers.Dense(10, activation="softmax"))

In [14]:
# Hyperparameters and bookkeeping objects for the custom training loop.
n_epochs = 5
batch_size = 32
# Number of optimisation steps per epoch (any final partial batch is dropped).
n_steps = len(X_train) // batch_size
# `learning_rate` is the supported argument name; the `lr` alias is deprecated
# and rejected by newer Keras optimizers.
optimizer = keras.optimizers.Nadam(learning_rate=0.01)
loss_fn = keras.losses.sparse_categorical_crossentropy
# Running mean of the training loss over the current epoch.
mean_loss = keras.metrics.Mean()
metrics = [keras.metrics.SparseCategoricalAccuracy()]

In [20]:
!pip install tqdm



In [26]:
from tqdm import trange
from collections import OrderedDict

In [23]:
def random_batch(X, y, batch_size=32):
    """Return a random batch of matching rows from ``X`` and ``y``.

    ``batch_size`` row indices are drawn uniformly from ``range(len(X))``
    with NumPy's global random generator (so the same row may be picked more
    than once), and the same indices are applied to both ``X`` and ``y``.
    """
    sample_count = len(X)
    indices = np.random.randint(sample_count, size=batch_size)
    X_batch = X[indices]
    y_batch = y[indices]
    return X_batch, y_batch

In [27]:
# Custom training loop: an outer progress bar over epochs and an inner one
# over the steps of each epoch. Running training statistics are shown on the
# inner bar, and validation statistics are appended at the end of each epoch.
with trange(1, n_epochs + 1, desc="All epochs") as epochs:
    for epoch in epochs:
        with trange(1, n_steps + 1, desc="Epoch {}/{}".format(epoch, n_epochs)) as steps:
            # Created before the step loop so the validation code below still
            # works when n_steps == 0.
            status = OrderedDict()
            for step in steps:
                # Pass batch_size explicitly so the batch actually drawn stays
                # consistent with the n_steps computed from it.
                X_batch, y_batch = random_batch(X_train, y_train, batch_size)
                with tf.GradientTape() as tape:
                    # training=True makes layers that behave differently at
                    # training time (e.g. dropout) run in training mode.
                    y_pred = model(X_batch, training=True)
                    main_loss = tf.reduce_mean(loss_fn(y_batch, y_pred))
                    # Add any extra losses registered on the model.
                    loss = tf.add_n([main_loss] + model.losses)
                gradients = tape.gradient(loss, model.trainable_variables)
                optimizer.apply_gradients(zip(gradients, model.trainable_variables))
                # Re-apply variable constraints after the optimizer update.
                for variable in model.variables:
                    if variable.constraint is not None:
                        variable.assign(variable.constraint(variable))
                # Update the running loss/metrics and show them on the bar.
                mean_loss(loss)
                status["loss"] = mean_loss.result().numpy()
                for metric in metrics:
                    metric(y_batch, y_pred)
                    status[metric.name] = metric.result().numpy()
                steps.set_postfix(status)
            # End of epoch: evaluate on the validation set (inference mode).
            y_pred = model(X_valid)
            status["val_loss"] = np.mean(loss_fn(y_valid, y_pred))
            status["val_accuracy"] = np.mean(keras.metrics.sparse_categorical_accuracy(
                tf.constant(y_valid, dtype=np.float32), y_pred))
            steps.set_postfix(status)
        # Reset the running loss and metrics so the next epoch starts afresh.
        for metric in [mean_loss] + metrics:
            metric.reset_states()

All epochs:   0%|                                                                                | 0/5 [00:00<?, ?it/s]
Epoch 1/5:   0%|                                                                              | 0/1718 [00:00<?, ?it/s][A
Epoch 1/5:   0%|                                 | 0/1718 [00:00<?, ?it/s, loss=3.5, sparse_categorical_accuracy=0.188][A
Epoch 1/5:   0%|                         | 1/1718 [00:00<11:38,  2.46it/s, loss=3.5, sparse_categorical_accuracy=0.188][A
Epoch 1/5:   0%|                        | 1/1718 [00:00<11:38,  2.46it/s, loss=3.03, sparse_categorical_accuracy=0.141][A
Epoch 1/5:   0%|                        | 1/1718 [00:00<11:38,  2.46it/s, loss=2.89, sparse_categorical_accuracy=0.219][A
Epoch 1/5:   0%|                        | 1/1718 [00:00<11:38,  2.46it/s, loss=2.59, sparse_categorical_accuracy=0.281][A
Epoch 1/5:   0%|                        | 1/1718 [00:00<11:38,  2.46it/s, loss=2.38, sparse_categorical_accuracy=0.338][A
Epoch 1/5:   0%|   

Epoch 1/5:   3%|▋                      | 50/1718 [00:01<00:54, 30.70it/s, loss=1.07, sparse_categorical_accuracy=0.624][A
Epoch 1/5:   3%|▋                       | 50/1718 [00:01<00:54, 30.70it/s, loss=1.06, sparse_categorical_accuracy=0.63][A
Epoch 1/5:   3%|▋                      | 50/1718 [00:01<00:54, 30.70it/s, loss=1.05, sparse_categorical_accuracy=0.632][A
Epoch 1/5:   3%|▋                      | 55/1718 [00:01<00:49, 33.48it/s, loss=1.05, sparse_categorical_accuracy=0.632][A
Epoch 1/5:   3%|▋                      | 55/1718 [00:01<00:49, 33.48it/s, loss=1.05, sparse_categorical_accuracy=0.633][A
Epoch 1/5:   3%|▋                      | 55/1718 [00:01<00:49, 33.48it/s, loss=1.04, sparse_categorical_accuracy=0.634][A
Epoch 1/5:   3%|▋                      | 55/1718 [00:01<00:49, 33.48it/s, loss=1.04, sparse_categorical_accuracy=0.635][A
Epoch 1/5:   3%|▋                      | 55/1718 [00:01<00:49, 33.48it/s, loss=1.04, sparse_categorical_accuracy=0.636][A
Epoch 1/5:   3%|

Epoch 1/5:   6%|█▎                   | 105/1718 [00:02<00:38, 41.76it/s, loss=0.868, sparse_categorical_accuracy=0.685][A
Epoch 1/5:   6%|█▎                    | 105/1718 [00:03<00:38, 41.76it/s, loss=0.87, sparse_categorical_accuracy=0.684][A
Epoch 1/5:   6%|█▎                   | 105/1718 [00:03<00:38, 41.76it/s, loss=0.867, sparse_categorical_accuracy=0.686][A
Epoch 1/5:   6%|█▎                   | 110/1718 [00:03<00:38, 41.97it/s, loss=0.867, sparse_categorical_accuracy=0.686][A
Epoch 1/5:   6%|█▎                   | 110/1718 [00:03<00:38, 41.97it/s, loss=0.867, sparse_categorical_accuracy=0.686][A
Epoch 1/5:   6%|█▎                   | 110/1718 [00:03<00:38, 41.97it/s, loss=0.864, sparse_categorical_accuracy=0.687][A
Epoch 1/5:   6%|█▎                   | 110/1718 [00:03<00:38, 41.97it/s, loss=0.864, sparse_categorical_accuracy=0.686][A
Epoch 1/5:   6%|█▍                    | 110/1718 [00:03<00:38, 41.97it/s, loss=0.86, sparse_categorical_accuracy=0.688][A
Epoch 1/5:   6%|

Epoch 1/5:   9%|██                    | 160/1718 [00:04<00:37, 41.81it/s, loss=0.77, sparse_categorical_accuracy=0.718][A
Epoch 1/5:   9%|██                    | 160/1718 [00:04<00:37, 41.81it/s, loss=0.77, sparse_categorical_accuracy=0.719][A
Epoch 1/5:   9%|█▉                   | 160/1718 [00:04<00:37, 41.81it/s, loss=0.769, sparse_categorical_accuracy=0.719][A
Epoch 1/5:  10%|██                   | 165/1718 [00:04<00:37, 41.49it/s, loss=0.769, sparse_categorical_accuracy=0.719][A
Epoch 1/5:  10%|██                   | 165/1718 [00:04<00:37, 41.49it/s, loss=0.771, sparse_categorical_accuracy=0.719][A
Epoch 1/5:  10%|██                    | 165/1718 [00:04<00:37, 41.49it/s, loss=0.77, sparse_categorical_accuracy=0.719][A
Epoch 1/5:  10%|██                    | 165/1718 [00:04<00:37, 41.49it/s, loss=0.769, sparse_categorical_accuracy=0.72][A
Epoch 1/5:  10%|██                    | 165/1718 [00:04<00:37, 41.49it/s, loss=0.768, sparse_categorical_accuracy=0.72][A
Epoch 1/5:  10%|

Epoch 1/5:  13%|██▋                  | 215/1718 [00:05<00:35, 42.47it/s, loss=0.757, sparse_categorical_accuracy=0.728][A
Epoch 1/5:  13%|██▋                  | 215/1718 [00:05<00:35, 42.47it/s, loss=0.756, sparse_categorical_accuracy=0.729][A
Epoch 1/5:  13%|██▋                  | 215/1718 [00:05<00:35, 42.47it/s, loss=0.756, sparse_categorical_accuracy=0.729][A
Epoch 1/5:  13%|██▋                  | 220/1718 [00:05<00:35, 42.26it/s, loss=0.756, sparse_categorical_accuracy=0.729][A
Epoch 1/5:  13%|██▋                  | 220/1718 [00:05<00:35, 42.26it/s, loss=0.757, sparse_categorical_accuracy=0.729][A
Epoch 1/5:  13%|██▋                  | 220/1718 [00:05<00:35, 42.26it/s, loss=0.756, sparse_categorical_accuracy=0.729][A
Epoch 1/5:  13%|██▋                  | 220/1718 [00:05<00:35, 42.26it/s, loss=0.757, sparse_categorical_accuracy=0.729][A
Epoch 1/5:  13%|██▋                  | 220/1718 [00:05<00:35, 42.26it/s, loss=0.756, sparse_categorical_accuracy=0.729][A
Epoch 1/5:  13%|

Epoch 1/5:  16%|███▍                  | 270/1718 [00:06<00:31, 45.43it/s, loss=0.722, sparse_categorical_accuracy=0.74][A
Epoch 1/5:  16%|███▍                  | 270/1718 [00:06<00:31, 45.43it/s, loss=0.721, sparse_categorical_accuracy=0.74][A
Epoch 1/5:  16%|███▌                   | 270/1718 [00:06<00:31, 45.43it/s, loss=0.72, sparse_categorical_accuracy=0.74][A
Epoch 1/5:  16%|███▋                   | 275/1718 [00:06<00:31, 45.19it/s, loss=0.72, sparse_categorical_accuracy=0.74][A
Epoch 1/5:  16%|███▋                   | 275/1718 [00:06<00:31, 45.19it/s, loss=0.72, sparse_categorical_accuracy=0.74][A
Epoch 1/5:  16%|███▎                 | 275/1718 [00:06<00:31, 45.19it/s, loss=0.719, sparse_categorical_accuracy=0.741][A
Epoch 1/5:  16%|███▎                 | 275/1718 [00:06<00:31, 45.19it/s, loss=0.719, sparse_categorical_accuracy=0.741][A
Epoch 1/5:  16%|███▎                 | 275/1718 [00:06<00:31, 45.19it/s, loss=0.719, sparse_categorical_accuracy=0.741][A
Epoch 1/5:  16%|

Epoch 1/5:  19%|████▏                 | 324/1718 [00:08<00:33, 41.60it/s, loss=0.69, sparse_categorical_accuracy=0.751][A
Epoch 1/5:  19%|████▏                 | 324/1718 [00:08<00:33, 41.60it/s, loss=0.69, sparse_categorical_accuracy=0.752][A
Epoch 1/5:  19%|████▏                 | 329/1718 [00:08<00:36, 38.40it/s, loss=0.69, sparse_categorical_accuracy=0.752][A
Epoch 1/5:  19%|████                 | 329/1718 [00:08<00:36, 38.40it/s, loss=0.689, sparse_categorical_accuracy=0.752][A
Epoch 1/5:  19%|████                 | 329/1718 [00:08<00:36, 38.40it/s, loss=0.689, sparse_categorical_accuracy=0.752][A
Epoch 1/5:  19%|████                 | 329/1718 [00:08<00:36, 38.40it/s, loss=0.689, sparse_categorical_accuracy=0.752][A
Epoch 1/5:  19%|████                 | 329/1718 [00:08<00:36, 38.40it/s, loss=0.688, sparse_categorical_accuracy=0.752][A
Epoch 1/5:  19%|████                 | 333/1718 [00:08<00:36, 38.36it/s, loss=0.688, sparse_categorical_accuracy=0.752][A
Epoch 1/5:  19%|

Epoch 1/5:  22%|████▌                | 378/1718 [00:09<00:30, 44.15it/s, loss=0.668, sparse_categorical_accuracy=0.758][A
Epoch 1/5:  22%|████▋                | 383/1718 [00:09<00:30, 43.86it/s, loss=0.668, sparse_categorical_accuracy=0.758][A
Epoch 1/5:  22%|████▋                | 383/1718 [00:09<00:30, 43.86it/s, loss=0.667, sparse_categorical_accuracy=0.758][A
Epoch 1/5:  22%|████▋                | 383/1718 [00:09<00:30, 43.86it/s, loss=0.668, sparse_categorical_accuracy=0.758][A
Epoch 1/5:  22%|████▋                | 383/1718 [00:09<00:30, 43.86it/s, loss=0.668, sparse_categorical_accuracy=0.759][A
Epoch 1/5:  22%|████▋                | 383/1718 [00:09<00:30, 43.86it/s, loss=0.667, sparse_categorical_accuracy=0.759][A
Epoch 1/5:  22%|████▋                | 383/1718 [00:09<00:30, 43.86it/s, loss=0.668, sparse_categorical_accuracy=0.759][A
Epoch 1/5:  23%|████▋                | 388/1718 [00:09<00:31, 42.34it/s, loss=0.668, sparse_categorical_accuracy=0.759][A
Epoch 1/5:  23%|

Epoch 1/5:  25%|█████▎               | 433/1718 [00:10<00:31, 41.18it/s, loss=0.652, sparse_categorical_accuracy=0.764][A
Epoch 1/5:  25%|█████▎               | 438/1718 [00:10<00:31, 40.65it/s, loss=0.652, sparse_categorical_accuracy=0.764][A
Epoch 1/5:  25%|█████▎               | 438/1718 [00:10<00:31, 40.65it/s, loss=0.652, sparse_categorical_accuracy=0.765][A
Epoch 1/5:  25%|█████▎               | 438/1718 [00:10<00:31, 40.65it/s, loss=0.652, sparse_categorical_accuracy=0.764][A
Epoch 1/5:  25%|█████▎               | 438/1718 [00:10<00:31, 40.65it/s, loss=0.651, sparse_categorical_accuracy=0.764][A
Epoch 1/5:  25%|█████▌                | 438/1718 [00:10<00:31, 40.65it/s, loss=0.65, sparse_categorical_accuracy=0.765][A
Epoch 1/5:  25%|█████▎               | 438/1718 [00:10<00:31, 40.65it/s, loss=0.651, sparse_categorical_accuracy=0.765][A
Epoch 1/5:  26%|█████▍               | 443/1718 [00:10<00:31, 40.76it/s, loss=0.651, sparse_categorical_accuracy=0.765][A
Epoch 1/5:  26%|

Epoch 1/5:  28%|█████▉               | 488/1718 [00:12<00:29, 41.02it/s, loss=0.633, sparse_categorical_accuracy=0.772][A
Epoch 1/5:  29%|██████               | 493/1718 [00:12<00:30, 40.55it/s, loss=0.633, sparse_categorical_accuracy=0.772][A
Epoch 1/5:  29%|██████               | 493/1718 [00:12<00:30, 40.55it/s, loss=0.633, sparse_categorical_accuracy=0.772][A
Epoch 1/5:  29%|██████               | 493/1718 [00:12<00:30, 40.55it/s, loss=0.632, sparse_categorical_accuracy=0.772][A
Epoch 1/5:  29%|██████               | 493/1718 [00:12<00:30, 40.55it/s, loss=0.633, sparse_categorical_accuracy=0.772][A
Epoch 1/5:  29%|██████               | 493/1718 [00:12<00:30, 40.55it/s, loss=0.632, sparse_categorical_accuracy=0.772][A
Epoch 1/5:  29%|██████               | 493/1718 [00:12<00:30, 40.55it/s, loss=0.632, sparse_categorical_accuracy=0.773][A
Epoch 1/5:  29%|██████               | 498/1718 [00:12<00:30, 39.74it/s, loss=0.632, sparse_categorical_accuracy=0.773][A
Epoch 1/5:  29%|

Epoch 1/5:  32%|██████▋              | 545/1718 [00:13<00:29, 39.68it/s, loss=0.621, sparse_categorical_accuracy=0.777][A
Epoch 1/5:  32%|██████▉               | 545/1718 [00:13<00:29, 39.68it/s, loss=0.62, sparse_categorical_accuracy=0.777][A
Epoch 1/5:  32%|██████▉               | 545/1718 [00:13<00:29, 39.68it/s, loss=0.62, sparse_categorical_accuracy=0.777][A
Epoch 1/5:  32%|██████▉               | 545/1718 [00:13<00:29, 39.68it/s, loss=0.62, sparse_categorical_accuracy=0.776][A
Epoch 1/5:  32%|███████               | 550/1718 [00:13<00:29, 39.90it/s, loss=0.62, sparse_categorical_accuracy=0.776][A
Epoch 1/5:  32%|███████               | 550/1718 [00:13<00:29, 39.90it/s, loss=0.62, sparse_categorical_accuracy=0.776][A
Epoch 1/5:  32%|███████               | 550/1718 [00:13<00:29, 39.90it/s, loss=0.62, sparse_categorical_accuracy=0.776][A
Epoch 1/5:  32%|███████               | 550/1718 [00:13<00:29, 39.90it/s, loss=0.62, sparse_categorical_accuracy=0.776][A
Epoch 1/5:  32%|

Epoch 1/5:  35%|███████▋              | 598/1718 [00:14<00:27, 41.45it/s, loss=0.609, sparse_categorical_accuracy=0.78][A
Epoch 1/5:  35%|███████▋              | 598/1718 [00:14<00:27, 41.45it/s, loss=0.608, sparse_categorical_accuracy=0.78][A
Epoch 1/5:  35%|███████▋              | 603/1718 [00:14<00:27, 40.15it/s, loss=0.608, sparse_categorical_accuracy=0.78][A
Epoch 1/5:  35%|████████               | 603/1718 [00:14<00:27, 40.15it/s, loss=0.61, sparse_categorical_accuracy=0.78][A
Epoch 1/5:  35%|████████               | 603/1718 [00:14<00:27, 40.15it/s, loss=0.61, sparse_categorical_accuracy=0.78][A
Epoch 1/5:  35%|████████               | 603/1718 [00:14<00:27, 40.15it/s, loss=0.61, sparse_categorical_accuracy=0.78][A
Epoch 1/5:  35%|████████               | 603/1718 [00:14<00:27, 40.15it/s, loss=0.61, sparse_categorical_accuracy=0.78][A
Epoch 1/5:  35%|████████               | 603/1718 [00:15<00:27, 40.15it/s, loss=0.61, sparse_categorical_accuracy=0.78][A
Epoch 1/5:  35%|

Epoch 1/5:  38%|███████▉             | 653/1718 [00:16<00:27, 38.79it/s, loss=0.595, sparse_categorical_accuracy=0.785][A
Epoch 1/5:  38%|████████             | 657/1718 [00:16<00:27, 38.83it/s, loss=0.595, sparse_categorical_accuracy=0.785][A
Epoch 1/5:  38%|████████             | 657/1718 [00:16<00:27, 38.83it/s, loss=0.596, sparse_categorical_accuracy=0.784][A
Epoch 1/5:  38%|████████             | 657/1718 [00:16<00:27, 38.83it/s, loss=0.596, sparse_categorical_accuracy=0.784][A
Epoch 1/5:  38%|████████             | 657/1718 [00:16<00:27, 38.83it/s, loss=0.596, sparse_categorical_accuracy=0.785][A
Epoch 1/5:  38%|████████             | 657/1718 [00:16<00:27, 38.83it/s, loss=0.595, sparse_categorical_accuracy=0.785][A
Epoch 1/5:  38%|████████             | 657/1718 [00:16<00:27, 38.83it/s, loss=0.595, sparse_categorical_accuracy=0.785][A
Epoch 1/5:  39%|████████             | 662/1718 [00:16<00:26, 40.24it/s, loss=0.595, sparse_categorical_accuracy=0.785][A
Epoch 1/5:  39%|

Epoch 1/5:  41%|████████▋            | 707/1718 [00:17<00:23, 42.95it/s, loss=0.587, sparse_categorical_accuracy=0.787][A
Epoch 1/5:  41%|████████▋            | 712/1718 [00:17<00:24, 41.36it/s, loss=0.587, sparse_categorical_accuracy=0.787][A
Epoch 1/5:  41%|████████▋            | 712/1718 [00:17<00:24, 41.36it/s, loss=0.587, sparse_categorical_accuracy=0.788][A
Epoch 1/5:  41%|████████▋            | 712/1718 [00:17<00:24, 41.36it/s, loss=0.587, sparse_categorical_accuracy=0.788][A
Epoch 1/5:  41%|████████▋            | 712/1718 [00:17<00:24, 41.36it/s, loss=0.587, sparse_categorical_accuracy=0.788][A
Epoch 1/5:  41%|████████▋            | 712/1718 [00:17<00:24, 41.36it/s, loss=0.587, sparse_categorical_accuracy=0.788][A
Epoch 1/5:  41%|████████▋            | 712/1718 [00:17<00:24, 41.36it/s, loss=0.587, sparse_categorical_accuracy=0.788][A
Epoch 1/5:  42%|████████▊            | 717/1718 [00:17<00:24, 40.92it/s, loss=0.587, sparse_categorical_accuracy=0.788][A
Epoch 1/5:  42%|

Epoch 1/5:  44%|█████████▎           | 762/1718 [00:18<00:22, 41.77it/s, loss=0.579, sparse_categorical_accuracy=0.791][A
Epoch 1/5:  45%|█████████▍           | 767/1718 [00:18<00:22, 41.92it/s, loss=0.579, sparse_categorical_accuracy=0.791][A
Epoch 1/5:  45%|█████████▍           | 767/1718 [00:18<00:22, 41.92it/s, loss=0.579, sparse_categorical_accuracy=0.791][A
Epoch 1/5:  45%|█████████▍           | 767/1718 [00:18<00:22, 41.92it/s, loss=0.579, sparse_categorical_accuracy=0.791][A
Epoch 1/5:  45%|█████████▍           | 767/1718 [00:18<00:22, 41.92it/s, loss=0.579, sparse_categorical_accuracy=0.791][A
Epoch 1/5:  45%|█████████▍           | 767/1718 [00:18<00:22, 41.92it/s, loss=0.578, sparse_categorical_accuracy=0.791][A
Epoch 1/5:  45%|█████████▍           | 767/1718 [00:18<00:22, 41.92it/s, loss=0.578, sparse_categorical_accuracy=0.791][A
Epoch 1/5:  45%|█████████▍           | 772/1718 [00:18<00:22, 41.46it/s, loss=0.578, sparse_categorical_accuracy=0.791][A
Epoch 1/5:  45%|

Epoch 1/5:  48%|█████████▉           | 817/1718 [00:20<00:21, 41.28it/s, loss=0.573, sparse_categorical_accuracy=0.792][A
Epoch 1/5:  48%|██████████           | 822/1718 [00:20<00:21, 41.12it/s, loss=0.573, sparse_categorical_accuracy=0.792][A
Epoch 1/5:  48%|██████████           | 822/1718 [00:20<00:21, 41.12it/s, loss=0.573, sparse_categorical_accuracy=0.792][A
Epoch 1/5:  48%|██████████           | 822/1718 [00:20<00:21, 41.12it/s, loss=0.573, sparse_categorical_accuracy=0.792][A
Epoch 1/5:  48%|██████████           | 822/1718 [00:20<00:21, 41.12it/s, loss=0.573, sparse_categorical_accuracy=0.792][A
Epoch 1/5:  48%|██████████           | 822/1718 [00:20<00:21, 41.12it/s, loss=0.573, sparse_categorical_accuracy=0.792][A
Epoch 1/5:  48%|██████████           | 822/1718 [00:20<00:21, 41.12it/s, loss=0.573, sparse_categorical_accuracy=0.792][A
Epoch 1/5:  48%|██████████           | 827/1718 [00:20<00:21, 41.11it/s, loss=0.573, sparse_categorical_accuracy=0.792][A
Epoch 1/5:  48%|

Epoch 1/5:  51%|██████████▋          | 873/1718 [00:21<00:26, 32.15it/s, loss=0.567, sparse_categorical_accuracy=0.795][A
Epoch 1/5:  51%|██████████▋          | 873/1718 [00:21<00:26, 32.15it/s, loss=0.567, sparse_categorical_accuracy=0.795][A
Epoch 1/5:  51%|██████████▋          | 873/1718 [00:21<00:26, 32.15it/s, loss=0.567, sparse_categorical_accuracy=0.795][A
Epoch 1/5:  51%|██████████▋          | 877/1718 [00:21<00:25, 33.16it/s, loss=0.567, sparse_categorical_accuracy=0.795][A
Epoch 1/5:  51%|██████████▋          | 877/1718 [00:21<00:25, 33.16it/s, loss=0.567, sparse_categorical_accuracy=0.795][A
Epoch 1/5:  51%|██████████▋          | 877/1718 [00:21<00:25, 33.16it/s, loss=0.567, sparse_categorical_accuracy=0.795][A
Epoch 1/5:  51%|██████████▋          | 877/1718 [00:21<00:25, 33.16it/s, loss=0.566, sparse_categorical_accuracy=0.795][A
Epoch 1/5:  51%|██████████▋          | 877/1718 [00:21<00:25, 33.16it/s, loss=0.566, sparse_categorical_accuracy=0.795][A
Epoch 1/5:  51%|

Epoch 1/5:  54%|███████████▎         | 925/1718 [00:23<00:24, 32.42it/s, loss=0.562, sparse_categorical_accuracy=0.796][A
Epoch 1/5:  54%|███████████▎         | 925/1718 [00:23<00:24, 32.42it/s, loss=0.562, sparse_categorical_accuracy=0.797][A
Epoch 1/5:  54%|███████████▎         | 929/1718 [00:23<00:23, 33.37it/s, loss=0.562, sparse_categorical_accuracy=0.797][A
Epoch 1/5:  54%|███████████▎         | 929/1718 [00:23<00:23, 33.37it/s, loss=0.562, sparse_categorical_accuracy=0.797][A
Epoch 1/5:  54%|███████████▎         | 929/1718 [00:23<00:23, 33.37it/s, loss=0.562, sparse_categorical_accuracy=0.797][A
Epoch 1/5:  54%|███████████▎         | 929/1718 [00:23<00:23, 33.37it/s, loss=0.562, sparse_categorical_accuracy=0.797][A
Epoch 1/5:  54%|███████████▎         | 929/1718 [00:23<00:23, 33.37it/s, loss=0.561, sparse_categorical_accuracy=0.797][A
Epoch 1/5:  54%|███████████▍         | 933/1718 [00:23<00:23, 33.51it/s, loss=0.561, sparse_categorical_accuracy=0.797][A
Epoch 1/5:  54%|

Epoch 1/5:  57%|███████████▉         | 977/1718 [00:24<00:21, 34.78it/s, loss=0.556, sparse_categorical_accuracy=0.799][A
Epoch 1/5:  57%|███████████▉         | 981/1718 [00:24<00:20, 35.18it/s, loss=0.556, sparse_categorical_accuracy=0.799][A
Epoch 1/5:  57%|███████████▉         | 981/1718 [00:24<00:20, 35.18it/s, loss=0.556, sparse_categorical_accuracy=0.799][A
Epoch 1/5:  57%|███████████▉         | 981/1718 [00:24<00:20, 35.18it/s, loss=0.556, sparse_categorical_accuracy=0.799][A
Epoch 1/5:  57%|███████████▉         | 981/1718 [00:24<00:20, 35.18it/s, loss=0.556, sparse_categorical_accuracy=0.799][A
Epoch 1/5:  57%|███████████▉         | 981/1718 [00:25<00:20, 35.18it/s, loss=0.556, sparse_categorical_accuracy=0.799][A
Epoch 1/5:  57%|████████████         | 985/1718 [00:25<00:20, 35.89it/s, loss=0.556, sparse_categorical_accuracy=0.799][A
Epoch 1/5:  57%|████████████         | 985/1718 [00:25<00:20, 35.89it/s, loss=0.556, sparse_categorical_accuracy=0.799][A
Epoch 1/5:  57%|

Epoch 1/5:  60%|████████████▌        | 1030/1718 [00:26<00:18, 36.85it/s, loss=0.55, sparse_categorical_accuracy=0.801][A
Epoch 1/5:  60%|████████████▋        | 1034/1718 [00:26<00:18, 36.48it/s, loss=0.55, sparse_categorical_accuracy=0.801][A
Epoch 1/5:  60%|████████████▋        | 1034/1718 [00:26<00:18, 36.48it/s, loss=0.55, sparse_categorical_accuracy=0.801][A
Epoch 1/5:  60%|████████████▋        | 1034/1718 [00:26<00:18, 36.48it/s, loss=0.55, sparse_categorical_accuracy=0.801][A
Epoch 1/5:  60%|████████████▋        | 1034/1718 [00:26<00:18, 36.48it/s, loss=0.55, sparse_categorical_accuracy=0.801][A
Epoch 1/5:  60%|████████████        | 1034/1718 [00:26<00:18, 36.48it/s, loss=0.549, sparse_categorical_accuracy=0.801][A
Epoch 1/5:  60%|████████████        | 1038/1718 [00:26<00:18, 36.92it/s, loss=0.549, sparse_categorical_accuracy=0.801][A
Epoch 1/5:  60%|████████████        | 1038/1718 [00:26<00:18, 36.92it/s, loss=0.549, sparse_categorical_accuracy=0.801][A
Epoch 1/5:  60%|

Epoch 1/5:  63%|████████████▌       | 1082/1718 [00:27<00:17, 35.92it/s, loss=0.545, sparse_categorical_accuracy=0.803][A
Epoch 1/5:  63%|████████████▋       | 1087/1718 [00:27<00:17, 36.88it/s, loss=0.545, sparse_categorical_accuracy=0.803][A
Epoch 1/5:  63%|████████████▋       | 1087/1718 [00:27<00:17, 36.88it/s, loss=0.545, sparse_categorical_accuracy=0.803][A
Epoch 1/5:  63%|████████████▋       | 1087/1718 [00:27<00:17, 36.88it/s, loss=0.545, sparse_categorical_accuracy=0.803][A
Epoch 1/5:  63%|████████████▋       | 1087/1718 [00:27<00:17, 36.88it/s, loss=0.545, sparse_categorical_accuracy=0.803][A
Epoch 1/5:  63%|████████████▋       | 1087/1718 [00:27<00:17, 36.88it/s, loss=0.545, sparse_categorical_accuracy=0.803][A
Epoch 1/5:  64%|████████████▋       | 1091/1718 [00:27<00:16, 37.11it/s, loss=0.545, sparse_categorical_accuracy=0.803][A
Epoch 1/5:  64%|████████████▋       | 1091/1718 [00:27<00:16, 37.11it/s, loss=0.545, sparse_categorical_accuracy=0.803][A
Epoch 1/5:  64%|

Epoch 1/5:  66%|█████████████▎      | 1139/1718 [00:29<00:15, 36.36it/s, loss=0.541, sparse_categorical_accuracy=0.804][A
Epoch 1/5:  66%|█████████████▎      | 1139/1718 [00:29<00:15, 36.36it/s, loss=0.541, sparse_categorical_accuracy=0.804][A
Epoch 1/5:  66%|█████████████▎      | 1139/1718 [00:29<00:15, 36.36it/s, loss=0.541, sparse_categorical_accuracy=0.804][A
Epoch 1/5:  66%|█████████████▎      | 1139/1718 [00:29<00:15, 36.36it/s, loss=0.541, sparse_categorical_accuracy=0.804][A
Epoch 1/5:  66%|█████████████▎      | 1139/1718 [00:29<00:15, 36.36it/s, loss=0.541, sparse_categorical_accuracy=0.804][A
Epoch 1/5:  67%|█████████████▎      | 1143/1718 [00:29<00:15, 36.89it/s, loss=0.541, sparse_categorical_accuracy=0.804][A
Epoch 1/5:  67%|█████████████▎      | 1143/1718 [00:29<00:15, 36.89it/s, loss=0.541, sparse_categorical_accuracy=0.804][A
Epoch 1/5:  67%|█████████████▎      | 1143/1718 [00:29<00:15, 36.89it/s, loss=0.541, sparse_categorical_accuracy=0.804][A
Epoch 1/5:  67%|

Epoch 1/5:  69%|█████████████▉      | 1192/1718 [00:30<00:12, 43.17it/s, loss=0.535, sparse_categorical_accuracy=0.807][A
Epoch 1/5:  69%|█████████████▉      | 1192/1718 [00:30<00:12, 43.17it/s, loss=0.535, sparse_categorical_accuracy=0.807][A
Epoch 1/5:  69%|█████████████▉      | 1192/1718 [00:30<00:12, 43.17it/s, loss=0.535, sparse_categorical_accuracy=0.807][A
Epoch 1/5:  69%|█████████████▉      | 1192/1718 [00:30<00:12, 43.17it/s, loss=0.535, sparse_categorical_accuracy=0.807][A
Epoch 1/5:  70%|█████████████▉      | 1197/1718 [00:30<00:12, 43.19it/s, loss=0.535, sparse_categorical_accuracy=0.807][A
Epoch 1/5:  70%|█████████████▉      | 1197/1718 [00:30<00:12, 43.19it/s, loss=0.535, sparse_categorical_accuracy=0.807][A
Epoch 1/5:  70%|█████████████▉      | 1197/1718 [00:30<00:12, 43.19it/s, loss=0.535, sparse_categorical_accuracy=0.807][A
Epoch 1/5:  70%|█████████████▉      | 1197/1718 [00:30<00:12, 43.19it/s, loss=0.535, sparse_categorical_accuracy=0.807][A
Epoch 1/5:  70%|

Epoch 1/5:  73%|██████████████▌     | 1247/1718 [00:31<00:10, 43.16it/s, loss=0.532, sparse_categorical_accuracy=0.808][A
Epoch 1/5:  73%|██████████████▌     | 1247/1718 [00:31<00:10, 43.16it/s, loss=0.532, sparse_categorical_accuracy=0.808][A
Epoch 1/5:  73%|██████████████▌     | 1247/1718 [00:31<00:10, 43.16it/s, loss=0.532, sparse_categorical_accuracy=0.808][A
Epoch 1/5:  73%|██████████████▌     | 1247/1718 [00:31<00:10, 43.16it/s, loss=0.531, sparse_categorical_accuracy=0.808][A
Epoch 1/5:  73%|██████████████▌     | 1252/1718 [00:31<00:10, 43.40it/s, loss=0.531, sparse_categorical_accuracy=0.808][A
Epoch 1/5:  73%|██████████████▌     | 1252/1718 [00:31<00:10, 43.40it/s, loss=0.532, sparse_categorical_accuracy=0.808][A
Epoch 1/5:  73%|██████████████▌     | 1252/1718 [00:32<00:10, 43.40it/s, loss=0.532, sparse_categorical_accuracy=0.808][A
Epoch 1/5:  73%|██████████████▌     | 1252/1718 [00:32<00:10, 43.40it/s, loss=0.531, sparse_categorical_accuracy=0.808][A
Epoch 1/5:  73%|

Epoch 1/5:  76%|███████████████▏    | 1302/1718 [00:33<00:10, 41.38it/s, loss=0.527, sparse_categorical_accuracy=0.809][A
Epoch 1/5:  76%|███████████████▏    | 1302/1718 [00:33<00:10, 41.38it/s, loss=0.527, sparse_categorical_accuracy=0.809][A
Epoch 1/5:  76%|███████████████▏    | 1302/1718 [00:33<00:10, 41.38it/s, loss=0.527, sparse_categorical_accuracy=0.809][A
Epoch 1/5:  76%|███████████████▏    | 1302/1718 [00:33<00:10, 41.38it/s, loss=0.527, sparse_categorical_accuracy=0.809][A
Epoch 1/5:  76%|███████████████▏    | 1307/1718 [00:33<00:10, 38.31it/s, loss=0.527, sparse_categorical_accuracy=0.809][A
Epoch 1/5:  76%|███████████████▏    | 1307/1718 [00:33<00:10, 38.31it/s, loss=0.527, sparse_categorical_accuracy=0.809][A
Epoch 1/5:  76%|███████████████▏    | 1307/1718 [00:33<00:10, 38.31it/s, loss=0.527, sparse_categorical_accuracy=0.809][A
Epoch 1/5:  76%|███████████████▏    | 1307/1718 [00:33<00:10, 38.31it/s, loss=0.527, sparse_categorical_accuracy=0.809][A
Epoch 1/5:  76%|

Epoch 1/5:  79%|███████████████▊    | 1355/1718 [00:34<00:08, 40.63it/s, loss=0.523, sparse_categorical_accuracy=0.811][A
Epoch 1/5:  79%|███████████████▊    | 1355/1718 [00:34<00:08, 40.63it/s, loss=0.523, sparse_categorical_accuracy=0.811][A
Epoch 1/5:  79%|███████████████▊    | 1355/1718 [00:34<00:08, 40.63it/s, loss=0.523, sparse_categorical_accuracy=0.811][A
Epoch 1/5:  79%|███████████████▊    | 1360/1718 [00:34<00:08, 41.17it/s, loss=0.523, sparse_categorical_accuracy=0.811][A
Epoch 1/5:  79%|███████████████▊    | 1360/1718 [00:34<00:08, 41.17it/s, loss=0.523, sparse_categorical_accuracy=0.811][A
Epoch 1/5:  79%|███████████████▊    | 1360/1718 [00:34<00:08, 41.17it/s, loss=0.522, sparse_categorical_accuracy=0.811][A
Epoch 1/5:  79%|███████████████▊    | 1360/1718 [00:34<00:08, 41.17it/s, loss=0.522, sparse_categorical_accuracy=0.811][A
Epoch 1/5:  79%|███████████████▊    | 1360/1718 [00:34<00:08, 41.17it/s, loss=0.522, sparse_categorical_accuracy=0.811][A
Epoch 1/5:  79%|

Epoch 1/5:  82%|████████████████▍   | 1412/1718 [00:36<00:08, 37.29it/s, loss=0.518, sparse_categorical_accuracy=0.812][A
Epoch 1/5:  82%|████████████████▍   | 1412/1718 [00:36<00:08, 37.29it/s, loss=0.518, sparse_categorical_accuracy=0.812][A
Epoch 1/5:  82%|████████████████▍   | 1412/1718 [00:36<00:08, 37.29it/s, loss=0.518, sparse_categorical_accuracy=0.812][A
Epoch 1/5:  82%|████████████████▍   | 1412/1718 [00:36<00:08, 37.29it/s, loss=0.518, sparse_categorical_accuracy=0.812][A
Epoch 1/5:  82%|████████████████▍   | 1412/1718 [00:36<00:08, 37.29it/s, loss=0.518, sparse_categorical_accuracy=0.812][A
Epoch 1/5:  82%|████████████████▍   | 1412/1718 [00:36<00:08, 37.29it/s, loss=0.518, sparse_categorical_accuracy=0.812][A
Epoch 1/5:  82%|████████████████▍   | 1417/1718 [00:36<00:07, 38.53it/s, loss=0.518, sparse_categorical_accuracy=0.812][A
Epoch 1/5:  82%|████████████████▍   | 1417/1718 [00:36<00:07, 38.53it/s, loss=0.517, sparse_categorical_accuracy=0.812][A
Epoch 1/5:  82%|

Epoch 1/5:  85%|█████████████████   | 1464/1718 [00:37<00:06, 40.43it/s, loss=0.516, sparse_categorical_accuracy=0.813][A
Epoch 1/5:  85%|█████████████████   | 1464/1718 [00:37<00:06, 40.43it/s, loss=0.515, sparse_categorical_accuracy=0.813][A
Epoch 1/5:  85%|█████████████████   | 1464/1718 [00:37<00:06, 40.43it/s, loss=0.515, sparse_categorical_accuracy=0.813][A
Epoch 1/5:  85%|█████████████████   | 1464/1718 [00:37<00:06, 40.43it/s, loss=0.515, sparse_categorical_accuracy=0.813][A
Epoch 1/5:  86%|█████████████████   | 1469/1718 [00:37<00:06, 40.28it/s, loss=0.515, sparse_categorical_accuracy=0.813][A
Epoch 1/5:  86%|█████████████████   | 1469/1718 [00:37<00:06, 40.28it/s, loss=0.515, sparse_categorical_accuracy=0.813][A
Epoch 1/5:  86%|█████████████████   | 1469/1718 [00:37<00:06, 40.28it/s, loss=0.515, sparse_categorical_accuracy=0.813][A
Epoch 1/5:  86%|█████████████████   | 1469/1718 [00:37<00:06, 40.28it/s, loss=0.515, sparse_categorical_accuracy=0.813][A
Epoch 1/5:  86%|

Epoch 1/5:  88%|█████████████████▋  | 1519/1718 [00:38<00:05, 37.84it/s, loss=0.513, sparse_categorical_accuracy=0.814][A
Epoch 1/5:  88%|█████████████████▋  | 1519/1718 [00:38<00:05, 37.84it/s, loss=0.513, sparse_categorical_accuracy=0.814][A
Epoch 1/5:  88%|█████████████████▋  | 1519/1718 [00:38<00:05, 37.84it/s, loss=0.513, sparse_categorical_accuracy=0.814][A
Epoch 1/5:  89%|█████████████████▋  | 1523/1718 [00:38<00:05, 38.14it/s, loss=0.513, sparse_categorical_accuracy=0.814][A
Epoch 1/5:  89%|█████████████████▋  | 1523/1718 [00:38<00:05, 38.14it/s, loss=0.513, sparse_categorical_accuracy=0.814][A
Epoch 1/5:  89%|█████████████████▋  | 1523/1718 [00:38<00:05, 38.14it/s, loss=0.513, sparse_categorical_accuracy=0.814][A
Epoch 1/5:  89%|█████████████████▋  | 1523/1718 [00:38<00:05, 38.14it/s, loss=0.513, sparse_categorical_accuracy=0.814][A
Epoch 1/5:  89%|█████████████████▋  | 1523/1718 [00:38<00:05, 38.14it/s, loss=0.513, sparse_categorical_accuracy=0.814][A
Epoch 1/5:  89%|

Epoch 1/5:  92%|███████████████████▎ | 1575/1718 [00:40<00:03, 41.38it/s, loss=0.51, sparse_categorical_accuracy=0.815][A
Epoch 1/5:  92%|███████████████████▎ | 1575/1718 [00:40<00:03, 41.38it/s, loss=0.51, sparse_categorical_accuracy=0.815][A
Epoch 1/5:  92%|███████████████████▎ | 1575/1718 [00:40<00:03, 41.38it/s, loss=0.51, sparse_categorical_accuracy=0.815][A
Epoch 1/5:  92%|███████████████████▎ | 1575/1718 [00:40<00:03, 41.38it/s, loss=0.51, sparse_categorical_accuracy=0.815][A
Epoch 1/5:  92%|███████████████████▎ | 1575/1718 [00:40<00:03, 41.38it/s, loss=0.51, sparse_categorical_accuracy=0.815][A
Epoch 1/5:  92%|███████████████████▎ | 1575/1718 [00:40<00:03, 41.38it/s, loss=0.51, sparse_categorical_accuracy=0.815][A
Epoch 1/5:  92%|███████████████████▎ | 1580/1718 [00:40<00:03, 41.73it/s, loss=0.51, sparse_categorical_accuracy=0.815][A
Epoch 1/5:  92%|███████████████████▎ | 1580/1718 [00:40<00:03, 41.73it/s, loss=0.51, sparse_categorical_accuracy=0.815][A
Epoch 1/5:  92%|

Epoch 1/5:  95%|██████████████████▉ | 1630/1718 [00:41<00:02, 41.37it/s, loss=0.507, sparse_categorical_accuracy=0.816][A
Epoch 1/5:  95%|██████████████████▉ | 1630/1718 [00:41<00:02, 41.37it/s, loss=0.507, sparse_categorical_accuracy=0.816][A
Epoch 1/5:  95%|██████████████████▉ | 1630/1718 [00:41<00:02, 41.37it/s, loss=0.507, sparse_categorical_accuracy=0.816][A
Epoch 1/5:  95%|██████████████████▉ | 1630/1718 [00:41<00:02, 41.37it/s, loss=0.507, sparse_categorical_accuracy=0.816][A
Epoch 1/5:  95%|██████████████████▉ | 1630/1718 [00:41<00:02, 41.37it/s, loss=0.507, sparse_categorical_accuracy=0.816][A
Epoch 1/5:  95%|██████████████████▉ | 1630/1718 [00:41<00:02, 41.37it/s, loss=0.507, sparse_categorical_accuracy=0.816][A
Epoch 1/5:  95%|███████████████████ | 1635/1718 [00:41<00:01, 41.90it/s, loss=0.507, sparse_categorical_accuracy=0.816][A
Epoch 1/5:  95%|███████████████████ | 1635/1718 [00:41<00:01, 41.90it/s, loss=0.507, sparse_categorical_accuracy=0.816][A
Epoch 1/5:  95%|

Epoch 1/5:  98%|███████████████████▌| 1685/1718 [00:42<00:00, 42.72it/s, loss=0.505, sparse_categorical_accuracy=0.817][A
Epoch 1/5:  98%|███████████████████▌| 1685/1718 [00:42<00:00, 42.72it/s, loss=0.505, sparse_categorical_accuracy=0.817][A
Epoch 1/5:  98%|███████████████████▌| 1685/1718 [00:42<00:00, 42.72it/s, loss=0.505, sparse_categorical_accuracy=0.817][A
Epoch 1/5:  98%|███████████████████▌| 1685/1718 [00:42<00:00, 42.72it/s, loss=0.505, sparse_categorical_accuracy=0.817][A
Epoch 1/5:  98%|███████████████████▌| 1685/1718 [00:42<00:00, 42.72it/s, loss=0.505, sparse_categorical_accuracy=0.817][A
Epoch 1/5:  98%|███████████████████▌| 1685/1718 [00:42<00:00, 42.72it/s, loss=0.505, sparse_categorical_accuracy=0.817][A
Epoch 1/5:  98%|███████████████████▋| 1690/1718 [00:42<00:00, 41.90it/s, loss=0.505, sparse_categorical_accuracy=0.817][A
Epoch 1/5:  98%|███████████████████▋| 1690/1718 [00:42<00:00, 41.90it/s, loss=0.505, sparse_categorical_accuracy=0.817][A
Epoch 1/5:  98%|

Epoch 2/5:   1%|▏                     | 19/1718 [00:00<00:41, 40.93it/s, loss=0.404, sparse_categorical_accuracy=0.881][A
Epoch 2/5:   1%|▏                     | 19/1718 [00:00<00:41, 40.93it/s, loss=0.402, sparse_categorical_accuracy=0.881][A
Epoch 2/5:   1%|▏                     | 19/1718 [00:00<00:41, 40.93it/s, loss=0.392, sparse_categorical_accuracy=0.883][A
Epoch 2/5:   1%|▏                     | 19/1718 [00:00<00:41, 40.93it/s, loss=0.386, sparse_categorical_accuracy=0.882][A
Epoch 2/5:   1%|▎                     | 24/1718 [00:00<00:41, 41.02it/s, loss=0.386, sparse_categorical_accuracy=0.882][A
Epoch 2/5:   1%|▎                     | 24/1718 [00:00<00:41, 41.02it/s, loss=0.386, sparse_categorical_accuracy=0.881][A
Epoch 2/5:   1%|▎                     | 24/1718 [00:00<00:41, 41.02it/s, loss=0.393, sparse_categorical_accuracy=0.881][A
Epoch 2/5:   1%|▎                      | 24/1718 [00:00<00:41, 41.02it/s, loss=0.39, sparse_categorical_accuracy=0.883][A
Epoch 2/5:   1%|

Epoch 2/5:   4%|▉                     | 75/1718 [00:01<00:41, 39.33it/s, loss=0.405, sparse_categorical_accuracy=0.858][A
Epoch 2/5:   4%|▉                     | 75/1718 [00:01<00:41, 39.33it/s, loss=0.403, sparse_categorical_accuracy=0.859][A
Epoch 2/5:   4%|▉                     | 75/1718 [00:01<00:41, 39.33it/s, loss=0.403, sparse_categorical_accuracy=0.858][A
Epoch 2/5:   4%|▉                     | 75/1718 [00:01<00:41, 39.33it/s, loss=0.402, sparse_categorical_accuracy=0.858][A
Epoch 2/5:   4%|▉                     | 75/1718 [00:01<00:41, 39.33it/s, loss=0.403, sparse_categorical_accuracy=0.857][A
Epoch 2/5:   4%|▉                     | 75/1718 [00:01<00:41, 39.33it/s, loss=0.402, sparse_categorical_accuracy=0.857][A
Epoch 2/5:   5%|█                     | 80/1718 [00:01<00:41, 39.84it/s, loss=0.402, sparse_categorical_accuracy=0.857][A
Epoch 2/5:   5%|█                     | 80/1718 [00:02<00:41, 39.84it/s, loss=0.402, sparse_categorical_accuracy=0.857][A
Epoch 2/5:   5%|

Epoch 2/5:   8%|█▌                   | 130/1718 [00:03<00:37, 42.39it/s, loss=0.386, sparse_categorical_accuracy=0.863][A
Epoch 2/5:   8%|█▌                   | 130/1718 [00:03<00:37, 42.39it/s, loss=0.387, sparse_categorical_accuracy=0.863][A
Epoch 2/5:   8%|█▋                    | 130/1718 [00:03<00:37, 42.39it/s, loss=0.39, sparse_categorical_accuracy=0.862][A
Epoch 2/5:   8%|█▋                    | 130/1718 [00:03<00:37, 42.39it/s, loss=0.39, sparse_categorical_accuracy=0.862][A
Epoch 2/5:   8%|█▋                    | 130/1718 [00:03<00:37, 42.39it/s, loss=0.39, sparse_categorical_accuracy=0.861][A
Epoch 2/5:   8%|█▋                    | 130/1718 [00:03<00:37, 42.39it/s, loss=0.39, sparse_categorical_accuracy=0.861][A
Epoch 2/5:   8%|█▋                    | 135/1718 [00:03<00:37, 42.69it/s, loss=0.39, sparse_categorical_accuracy=0.861][A
Epoch 2/5:   8%|█▋                   | 135/1718 [00:03<00:37, 42.69it/s, loss=0.391, sparse_categorical_accuracy=0.861][A
Epoch 2/5:   8%|

Epoch 2/5:  11%|██▎                  | 185/1718 [00:04<00:40, 37.63it/s, loss=0.394, sparse_categorical_accuracy=0.859][A
Epoch 2/5:  11%|██▎                  | 185/1718 [00:04<00:40, 37.63it/s, loss=0.395, sparse_categorical_accuracy=0.859][A
Epoch 2/5:  11%|██▎                  | 185/1718 [00:04<00:40, 37.63it/s, loss=0.394, sparse_categorical_accuracy=0.859][A
Epoch 2/5:  11%|██▎                  | 185/1718 [00:04<00:40, 37.63it/s, loss=0.394, sparse_categorical_accuracy=0.859][A
Epoch 2/5:  11%|██▎                  | 185/1718 [00:04<00:40, 37.63it/s, loss=0.396, sparse_categorical_accuracy=0.858][A
Epoch 2/5:  11%|██▎                  | 189/1718 [00:04<00:40, 37.69it/s, loss=0.396, sparse_categorical_accuracy=0.858][A
Epoch 2/5:  11%|██▎                  | 189/1718 [00:04<00:40, 37.69it/s, loss=0.397, sparse_categorical_accuracy=0.858][A
Epoch 2/5:  11%|██▎                  | 189/1718 [00:04<00:40, 37.69it/s, loss=0.397, sparse_categorical_accuracy=0.858][A
Epoch 2/5:  11%|

Epoch 2/5:  14%|██▉                  | 236/1718 [00:05<00:35, 41.64it/s, loss=0.401, sparse_categorical_accuracy=0.859][A
Epoch 2/5:  14%|███▏                   | 236/1718 [00:05<00:35, 41.64it/s, loss=0.4, sparse_categorical_accuracy=0.859][A
Epoch 2/5:  14%|███▏                   | 241/1718 [00:06<00:36, 40.13it/s, loss=0.4, sparse_categorical_accuracy=0.859][A
All epochs:  20%|██████████████▍                                                         | 1/5 [00:49<03:19, 49.99s/it]


KeyboardInterrupt: 