<a href="https://colab.research.google.com/github/atick-faisal/MultiViewUNet-Aneurysm/blob/main/src/training/MultiViewUNet.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

# Colab Info


In [1]:
from psutil import virtual_memory

gpu_info = !nvidia-smi
gpu_info = '\n'.join(gpu_info)
if gpu_info.find('failed') >= 0:
    print('Not connected to a GPU')
else:
    print(gpu_info)


ram_gb = virtual_memory().total / 1e9
print('Your runtime has {:.1f} gigabytes of available RAM\n'.format(ram_gb))

if ram_gb < 20:
    print('Not using a high-RAM runtime')
else:
    print('You are using a high-RAM runtime!')


Tue Jun 20 09:26:45 2023       
+-----------------------------------------------------------------------------+
| NVIDIA-SMI 525.85.12    Driver Version: 525.85.12    CUDA Version: 12.0     |
|-------------------------------+----------------------+----------------------+
| GPU  Name        Persistence-M| Bus-Id        Disp.A | Volatile Uncorr. ECC |
| Fan  Temp  Perf  Pwr:Usage/Cap|         Memory-Usage | GPU-Util  Compute M. |
|                               |                      |               MIG M. |
|   0  Tesla T4            Off  | 00000000:00:04.0 Off |                    0 |
| N/A   38C    P8     9W /  70W |      0MiB / 15360MiB |      0%      Default |
|                               |                      |                  N/A |
+-------------------------------+----------------------+----------------------+
                                                                               
+-----------------------------------------------------------------------------+
| Proces

# Fix for GDrive


In [2]:
# Upgrade gdown to the newest available release (pre-releases allowed via
# --pre, pip cache bypassed); pip's stdout is discarded.
!pip install -U --no-cache-dir gdown --pre > /dev/null


# Mount GDrive


In [3]:
from google.colab import drive
# Mount Google Drive at /content/drive; MODEL_PATH and PRED_PATH in the config
# cell point below this mount point.
drive.mount('/content/drive')


Mounted at /content/drive


# Download and Extract Dataset


In [4]:
# Download the dataset archive from Google Drive by file id (the recorded
# output shows it is saved as /content/AAA_DATASET_r3.zip).
!gdown "1AoEOeOpN0-x6Rj73OqRfnwMciiTayy73"
# Extract it into the working directory, overwriting existing files (-o);
# unzip's stdout is discarded.
!unzip -o "AAA_DATASET_r3.zip" > /dev/null


Downloading...
From (uriginal): https://drive.google.com/uc?id=1AoEOeOpN0-x6Rj73OqRfnwMciiTayy73
From (redirected): https://drive.google.com/uc?id=1AoEOeOpN0-x6Rj73OqRfnwMciiTayy73&confirm=t&uuid=3ce755c6-74bb-4aaa-b21a-b8cfd5f64a8c
To: /content/AAA_DATASET_r3.zip
100% 1.14G/1.14G [00:08<00:00, 134MB/s]


# Imports


In [5]:
import os
import datetime
import matplotlib
import pandas as pd
import tensorflow as tf
import matplotlib.pyplot as plt

from tqdm import tqdm

matplotlib.use('Agg')
plt.rcParams["font.size"] = 16


# Config


In [6]:
# Task identifier of the form "<input>_2_<target>"; the two halves are used
# below as the names of the input and target image sub-directories.
PROBLEM = "TAWSS_2_ECAP"

# Only used to build EXP_NAME (it does not select the architecture).
MODEL_NAME = "MultiViewUNet"
# Root folder of the images, with Train/ and Test/ sub-folders.
DATASET_PATH = "/content/Images/"
TRAIN_DIR = "Train/"
TEST_DIR = "Test/"
# Sub-directory names derived from PROBLEM (text before / after "_2_").
INPUT_DIR = PROBLEM.split("_2_")[0]
TARGET_DIR = PROBLEM.split("_2_")[1]
# Output locations on the mounted Google Drive.
MODEL_PATH = "/content/drive/MyDrive/Research/TAVI/Models/"
PRED_PATH = "/content/drive/MyDrive/Research/TAVI/Predictions/"
# Images are resized to IMG_SIZE x IMG_SIZE when loaded.
IMG_SIZE = 256
BATCH_SIZE = 16
# Shuffle buffer size of the training pipeline.
BUFFER_SIZE = 1000
# NOTE(review): VAL_SPLIT is not referenced in the visible part of the
# notebook; validation uses the Test/ images instead -- confirm intent.
VAL_SPLIT = 0.2
LEARNING_RATE = 0.001
N_EPOCHS = 300
# Early-stopping patience, in epochs.
PATIENCE = 30

# Experiment name; used as checkpoint prefix and prediction sub-folder.
EXP_NAME = f"{PROBLEM}_{MODEL_NAME}_I{IMG_SIZE}_B{BATCH_SIZE}_LR{LEARNING_RATE}"


# Architecture


In [7]:
class UNet:
    """Builder for a U-Net-style encoder/decoder Keras model.

    The constructor only stores hyper-parameters. Calling the instance
    (``UNet(img_size)()``) wires the layers together and returns a
    ``tf.keras.Model``.

    Args:
        img_size: Height and width of the (square) input image.
        n_channels: Number of channels of the input image.
        width: Number of filters of the first convolution block; level ``i``
            uses ``2 ** i * width`` filters.
        depth: Number of pooling steps on the way down, and of transposed
            convolutions on the way up.
        kernel_size: Kernel size of the convolutions inside ``conv`` blocks.
    """

    def __init__(
        self,
        img_size: int,
        n_channels: int = 3,
        width: int = 32,
        depth: int = 4,
        kernel_size: int = 3
    ) -> None:
        self.img_size = img_size
        self.n_channels = n_channels
        self.width = width
        self.depth = depth
        self.kernel_size = kernel_size

    @staticmethod
    def conv(
        x: tf.Tensor,
        filters: int,
        kernel_size: int
    ) -> tf.Tensor:
        """Apply two consecutive Conv2D -> BatchNormalization -> ReLU stages.

        Args:
            x: Input feature map.
            filters: Number of filters of both convolutions.
            kernel_size: Kernel size of both convolutions.

        Returns:
            The output of the second ReLU.
        """
        # The loop index is unused; the body simply runs twice.
        for i in range(2):
            x = tf.keras.layers.Conv2D(
                filters=filters,
                kernel_size=kernel_size,
                strides=1,
                padding="same",
                data_format="channels_last",
                dilation_rate=1,
                groups=1,
                activation=None,
                use_bias=True,
                kernel_initializer="glorot_uniform",
                bias_initializer="zeros",
            )(x)

            x = tf.keras.layers.BatchNormalization()(x)
            x = tf.keras.layers.Activation("relu")(x)

        return x

    @staticmethod
    def deconv(x: tf.Tensor, filters: int) -> tf.Tensor:
        """Upsample with a 2x2, stride-2 transposed convolution, then BN and ReLU.

        Args:
            x: Input feature map.
            filters: Number of output filters.

        Returns:
            The activated, upsampled feature map.
        """
        x = tf.keras.layers.Conv2DTranspose(
            filters=filters,
            kernel_size=2,
            strides=2,
            padding="same",
            output_padding=None,
            data_format=None,
            dilation_rate=1,
            activation=None,
            use_bias=True,
            kernel_initializer="glorot_uniform",
            bias_initializer="zeros",
        )(x)

        x = tf.keras.layers.BatchNormalization()(x)
        x = tf.keras.layers.Activation("relu")(x)

        return x

    @staticmethod
    def output(x: tf.Tensor) -> tf.Tensor:
        """Map features to the model output with a 1x1 convolution.

        The output always has 3 channels and uses a sigmoid activation,
        independently of ``n_channels``.
        """
        return tf.keras.layers.Conv2D(3, (1, 1), activation="sigmoid")(x)

    @staticmethod
    def pool(x: tf.Tensor, pool_size: int = 2) -> tf.Tensor:
        """Apply max pooling with the given pool size."""
        return tf.keras.layers.MaxPool2D(pool_size)(x)

    @staticmethod
    def dropout(x: tf.Tensor, amount: float = 0.5) -> tf.Tensor:
        """Apply dropout with rate ``amount``."""
        return tf.keras.layers.Dropout(amount)(x)

    def __call__(self) -> tf.keras.Model:
        """Build the network and return it as a ``tf.keras.Model``.

        As a side effect the bottleneck tensor is stored in ``self.features``.

        Returns:
            A functional Keras model mapping an
            ``(img_size, img_size, n_channels)`` image to the tensor produced
            by ``output`` (3 channels, sigmoid).
        """
        inputs = tf.keras.layers.Input(
            shape=(self.img_size, self.img_size, self.n_channels)
        )

        # scaled = tf.keras.layers.Rescaling(1./255.0, offset=0)(inputs)

        # ------------------ Downsampling ---------------------
        # downsample_layers[0] is the un-pooled first conv block; every later
        # entry i is conv -> pool -> dropout applied to entry i - 1.
        downsample_layers = []
        downsample_layers.append(
            self.conv(
                x=inputs,
                filters=self.width,
                kernel_size=self.kernel_size
            )
        )
        for i in range(1, self.depth):
            # Lighter dropout on the first pooled level only.
            dropout_amount = 0.2 if i == 1 else 0.5
            filters = int((2 ** i) * self.width)
            downsample_layers.append(
                self.dropout(
                    self.pool(
                        self.conv(
                            x=downsample_layers[i - 1],
                            filters=filters,
                            kernel_size=self.kernel_size
                        )
                    ),
                    amount=dropout_amount
                )
            )

        # ------------------- Features --------------------
        # Bottleneck: one more conv block followed by pooling (no dropout).
        n_features = int((2 ** self.depth) * self.width)
        self.features = self.pool(
            self.conv(
                x=downsample_layers[-1],
                filters=n_features,
                kernel_size=self.kernel_size
            )
        )

        # ------------------- Upsampling --------------------
        # Step i upsamples the previous decoder output, concatenates it with
        # the encoder entry downsample_layers[depth - i] (skip connection),
        # applies dropout with the default rate and then a conv block.
        upsample_layers = []
        upsample_layers.append(self.features)
        for i in range(1, self.depth + 1):
            filters = int((2 ** (self.depth - i)) * self.width)
            upsample_layers.append(
                self.conv(
                    x=self.dropout(
                        tf.keras.layers.concatenate([
                            downsample_layers[self.depth - i],
                            self.deconv(
                                x=upsample_layers[i - 1],
                                filters=filters
                            )
                        ])
                    ),
                    filters=filters,
                    kernel_size=self.kernel_size
                )
            )

        # ---------------------- Output -----------------------
        outputs = self.output(upsample_layers[-1])

        return tf.keras.Model(inputs, outputs)


In [8]:
# ... MultiResUNet
from keras.layers import Input, Conv2D, MaxPooling2D, Conv2DTranspose, concatenate, BatchNormalization, Activation, add
from keras.models import Model, model_from_json
from keras.optimizers import Adam
# from keras.layers.advanced_activations import ELU, LeakyReLU
from keras.utils.vis_utils import plot_model


def conv2d_bn(x, filters, num_row, num_col, padding='same', strides=(1, 1), activation='relu', name=None):
    '''
    2D convolution followed by batch normalization and an optional activation

    The convolution has no bias term and the batch normalization (over
    axis 3) has no learned scale.

    Arguments:
        x {keras layer} -- input layer
        filters {int} -- number of filters
        num_row {int} -- number of rows in filters
        num_col {int} -- number of columns in filters

    Keyword Arguments:
        padding {str} -- mode of padding (default: {'same'})
        strides {tuple} -- stride of convolution operation (default: {(1, 1)})
        activation {str} -- activation function; None skips the activation
            layer entirely (default: {'relu'})
        name {str} -- name given to the activation layer; unused when
            activation is None (default: {None})

    Returns:
        [keras layer] -- [output layer]
    '''

    x = Conv2D(filters, (num_row, num_col), strides=strides,
               padding=padding, use_bias=False)(x)
    x = BatchNormalization(axis=3, scale=False)(x)

    # Identity test: None is a singleton, so `is None` is the correct check.
    if activation is None:
        return x

    return Activation(activation, name=name)(x)


def trans_conv2d_bn(x, filters, num_row, num_col, padding='same', strides=(2, 2), name=None):
    '''
    Transposed 2D convolution followed by batch normalization

    The batch normalization runs over axis 3 without a learned scale.
    No activation is applied.

    Arguments:
        x {keras layer} -- input layer
        filters {int} -- number of filters
        num_row {int} -- number of rows in filters
        num_col {int} -- number of columns in filters

    Keyword Arguments:
        padding {str} -- mode of padding (default: {'same'})
        strides {tuple} -- stride of convolution operation (default: {(2, 2)})
        name {str} -- accepted for interface symmetry; not used by this
            function (default: {None})

    Returns:
        [keras layer] -- [output layer]
    '''

    kernel_shape = (num_row, num_col)
    upsampled = Conv2DTranspose(
        filters,
        kernel_shape,
        strides=strides,
        padding=padding,
    )(x)

    return BatchNormalization(axis=3, scale=False)(upsampled)


def MultiResBlock(U, inp, alpha=1.67):
    '''
    MultiRes Block

    Three chained 3x3 convolutions (named conv3x3 / conv5x5 / conv7x7 in the
    reference implementation) are concatenated, batch-normalized and added
    to a 1x1-convolved shortcut of the input.

    Arguments:
        U {int} -- Number of filters in a corresponding UNet stage
        inp {keras layer} -- input layer

    Keyword Arguments:
        alpha {float} -- multiplier applied to U before it is split between
            the three branches (default: {1.67})

    Returns:
        [keras layer] -- [output layer]
    '''

    scaled_width = alpha * U
    # Filters per branch, truncated to int; the shortcut gets their sum so
    # that it can be added to the concatenated branches.
    branch_filters = [int(scaled_width * share) for share in (0.167, 0.333, 0.5)]

    residual = conv2d_bn(inp, sum(branch_filters), 1, 1,
                         activation=None, padding='same')

    # Each branch consumes the previous branch's output.
    branches = []
    current = inp
    for n_filters in branch_filters:
        current = conv2d_bn(current, n_filters, 3, 3,
                            activation='relu', padding='same')
        branches.append(current)

    merged = concatenate(branches, axis=3)
    merged = BatchNormalization(axis=3)(merged)

    merged = add([residual, merged])
    merged = Activation('relu')(merged)
    merged = BatchNormalization(axis=3)(merged)

    return merged


def ResPath(filters, length, inp):
    '''
    ResPath

    A chain of residual stages. Each stage adds a 1x1-convolved shortcut to
    a 3x3 convolution of the same tensor, then applies ReLU and batch
    normalization.

    Arguments:
        filters {int} -- number of filters of every convolution in the path
        length {int} -- number of residual stages; at least one stage is
            always applied
        inp {keras layer} -- input layer

    Returns:
        [keras layer] -- [output layer]
    '''

    current = inp

    # One unconditional stage plus (length - 1) more, i.e. max(length, 1).
    for _ in range(max(length, 1)):
        residual = conv2d_bn(current, filters, 1, 1,
                             activation=None, padding='same')
        current = conv2d_bn(current, filters, 3, 3,
                            activation='relu', padding='same')

        current = add([residual, current])
        current = Activation('relu')(current)
        current = BatchNormalization(axis=3)(current)

    return current


def MultiResUNet(height, width, n_channels):
    '''
    MultiResUNet

    Four encoder levels (32, 64, 128, 256 filters), a 512-filter bottleneck
    and four decoder levels. Each encoder output reaches the decoder through
    a ResPath of length 4, 3, 2 and 1 respectively. The output layer is a
    1x1 conv2d_bn with 3 filters and a sigmoid activation.

    Arguments:
        height {int} -- height of image
        width {int} -- width of image
        n_channels {int} -- number of channels in image

    Returns:
        [keras model] -- MultiResUNet model
    '''
    # NOTE(review): with four 2x2 poolings, height and width presumably need
    # to be multiples of 16 for the skip concatenations to line up -- confirm.

    base_filters = 32
    respath_lengths = (4, 3, 2, 1)

    model_input = Input((height, width, n_channels))

    # Encoder: MultiRes block -> pooling; the un-pooled block output is
    # routed through a ResPath and kept as the skip connection.
    skips = []
    x = model_input
    for level, respath_length in enumerate(respath_lengths):
        level_filters = base_filters * 2 ** level
        encoded = MultiResBlock(level_filters, x)
        x = MaxPooling2D(pool_size=(2, 2))(encoded)
        skips.append(ResPath(level_filters, respath_length, encoded))

    # Bottleneck
    x = MultiResBlock(base_filters * 16, x)

    # Decoder: upsample, concatenate with the matching skip, MultiRes block.
    for level in reversed(range(len(respath_lengths))):
        level_filters = base_filters * 2 ** level
        upsampled = Conv2DTranspose(
            level_filters, (2, 2), strides=(2, 2), padding='same')(x)
        merged = concatenate([upsampled, skips[level]], axis=3)
        x = MultiResBlock(level_filters, merged)

    head = conv2d_bn(x, 3, 1, 1, activation='sigmoid')

    return Model(inputs=[model_input], outputs=[head])


# def main():

#     # Define the model

#     model = MultiResUNet(128, 128, 3)
#     print(model.summary())


# if __name__ == '__main__':
#     main()


In [9]:
# # ... MultiResUNet3D
# from keras.layers import Input, Conv3D, MaxPooling3D, Conv3DTranspose, concatenate, BatchNormalization, Activation, add
# from keras.models import Model, model_from_json
# from keras.optimizers import Adam
# # from keras.layers.advanced_activations import ELU, LeakyReLU
# from keras.utils.vis_utils import plot_model


# def conv3d_bn(x, filters, num_row, num_col, num_z, padding='same', strides=(1, 1, 1), activation='relu', name=None):
#     '''
#     3D Convolutional layers

#     Arguments:
#         x {keras layer} -- input layer
#         filters {int} -- number of filters
#         num_row {int} -- number of rows in filters
#         num_col {int} -- number of columns in filters
#         num_z {int} -- length along z axis in filters

#     Keyword Arguments:
#         padding {str} -- mode of padding (default: {'same'})
#         strides {tuple} -- stride of convolution operation (default: {(1, 1, 1)})
#         activation {str} -- activation function (default: {'relu'})
#         name {str} -- name of the layer (default: {None})

#     Returns:
#         [keras layer] -- [output layer]
#     '''

#     x = Conv3D(filters, (num_row, num_col, num_z),
#                strides=strides, padding=padding, use_bias=False)(x)
#     x = BatchNormalization(axis=4, scale=False)(x)

#     if(activation == None):
#         return x

#     x = Activation(activation, name=name)(x)
#     return x


# def trans_conv3d_bn(x, filters, num_row, num_col, num_z, padding='same', strides=(2, 2, 2), name=None):
#     '''
#     3D Transposed Convolutional layers

#     Arguments:
#         x {keras layer} -- input layer
#         filters {int} -- number of filters
#         num_row {int} -- number of rows in filters
#         num_col {int} -- number of columns in filters
#         num_z {int} -- length along z axis in filters

#     Keyword Arguments:
#         padding {str} -- mode of padding (default: {'same'})
#         strides {tuple} -- stride of convolution operation (default: {(2, 2, 2)})
#         name {str} -- name of the layer (default: {None})

#     Returns:
#         [keras layer] -- [output layer]
#     '''

#     x = Conv3DTranspose(filters, (num_row, num_col, num_z),
#                         strides=strides, padding=padding)(x)
#     x = BatchNormalization(axis=4, scale=False)(x)

#     return x


# def MultiResBlock(U, inp, alpha=1.67):
#     '''
#     MultiRes Block

#     Arguments:
#         U {int} -- Number of filters in a corrsponding UNet stage
#         inp {keras layer} -- input layer

#     Returns:
#         [keras layer] -- [output layer]
#     '''

#     W = alpha * U

#     shortcut = inp

#     shortcut = conv3d_bn(shortcut, int(W*0.167) + int(W*0.333) +
#                          int(W*0.5), 1, 1, 1, activation=None, padding='same')

#     conv3x3 = conv3d_bn(inp, int(W*0.167), 3, 3, 3,
#                         activation='relu', padding='same')

#     conv5x5 = conv3d_bn(conv3x3, int(W*0.333), 3, 3, 3,
#                         activation='relu', padding='same')

#     conv7x7 = conv3d_bn(conv5x5, int(W*0.5), 3, 3, 3,
#                         activation='relu', padding='same')

#     out = concatenate([conv3x3, conv5x5, conv7x7], axis=4)
#     out = BatchNormalization(axis=4)(out)

#     out = add([shortcut, out])
#     out = Activation('relu')(out)
#     out = BatchNormalization(axis=4)(out)

#     return out


# def ResPath(filters, length, inp):
#     '''
#     ResPath

#     Arguments:
#         filters {int} -- [description]
#         length {int} -- length of ResPath
#         inp {keras layer} -- input layer

#     Returns:
#         [keras layer] -- [output layer]
#     '''

#     shortcut = inp
#     shortcut = conv3d_bn(shortcut, filters, 1, 1, 1,
#                          activation=None, padding='same')

#     out = conv3d_bn(inp, filters, 3, 3, 3, activation='relu', padding='same')

#     out = add([shortcut, out])
#     out = Activation('relu')(out)
#     out = BatchNormalization(axis=4)(out)

#     for i in range(length-1):

#         shortcut = out
#         shortcut = conv3d_bn(shortcut, filters, 1, 1, 1,
#                              activation=None, padding='same')

#         out = conv3d_bn(out, filters, 3, 3, 3,
#                         activation='relu', padding='same')

#         out = add([shortcut, out])
#         out = Activation('relu')(out)
#         out = BatchNormalization(axis=4)(out)

#     return out


# def MultiResUnet3D(height, width, z, n_channels):
#     '''
#     MultiResUNet3D

#     Arguments:
#         height {int} -- height of image
#         width {int} -- width of image
#         z {int} -- length along z axis
#         n_channels {int} -- number of channels in image

#     Returns:
#         [keras model] -- MultiResUNet3D model
#     '''

#     inputs = Input((height, width, z, n_channels))

#     mresblock1 = MultiResBlock(32, inputs)
#     pool1 = MaxPooling3D(pool_size=(2, 2, 2))(mresblock1)
#     mresblock1 = ResPath(32, 4, mresblock1)

#     mresblock2 = MultiResBlock(32*2, pool1)
#     pool2 = MaxPooling3D(pool_size=(2, 2, 2))(mresblock2)
#     mresblock2 = ResPath(32*2, 3, mresblock2)

#     mresblock3 = MultiResBlock(32*4, pool2)
#     pool3 = MaxPooling3D(pool_size=(2, 2, 2))(mresblock3)
#     mresblock3 = ResPath(32*4, 2, mresblock3)

#     mresblock4 = MultiResBlock(32*8, pool3)
#     pool4 = MaxPooling3D(pool_size=(2, 2, 2))(mresblock4)
#     mresblock4 = ResPath(32*8, 1, mresblock4)

#     mresblock5 = MultiResBlock(32*16, pool4)

#     up6 = concatenate([Conv3DTranspose(
#         32*8, (2, 2, 2), strides=(2, 2, 2), padding='same')(mresblock5), mresblock4], axis=4)
#     mresblock6 = MultiResBlock(32*8, up6)

#     up7 = concatenate([Conv3DTranspose(
#         32*4, (2, 2, 2), strides=(2, 2, 2), padding='same')(mresblock6), mresblock3], axis=4)
#     mresblock7 = MultiResBlock(32*4, up7)

#     up8 = concatenate([Conv3DTranspose(
#         32*2, (2, 2, 2), strides=(2, 2, 2), padding='same')(mresblock7), mresblock2], axis=4)
#     mresblock8 = MultiResBlock(32*2, up8)

#     up9 = concatenate([Conv3DTranspose(32, (2, 2, 2), strides=(
#         2, 2, 2), padding='same')(mresblock8), mresblock1], axis=4)
#     mresblock9 = MultiResBlock(32, up9)

#     conv10 = conv3d_bn(mresblock9, 3, 1, 1, 1, activation='sigmoid')

#     model = Model(inputs=[inputs], outputs=[conv10])

#     return model


# # def main():

# #     # Define the model

# #     model = MultiResUnet3D(80, 80, 48, 4)
# #     print(model.summary())


# # if __name__ == '__main__':
# #     main()


# Loss Functions / Metrics


In [10]:
@tf.function
def attention_mse(y_true, y_pred):
    """Mean squared error over the target entries that are not exactly 1.0.

    Entries of ``y_true`` equal to 1.0 are excluded from the loss, together
    with the corresponding entries of ``y_pred``. The mask is element-wise:
    each channel value is tested on its own.

    NOTE(review): the prediction-saving cell treats a pixel as background
    only when all three channels are 1.0, whereas this mask also drops single
    saturated channels of coloured pixels -- confirm this is intended.

    Args:
        y_true: Target tensor.
        y_pred: Prediction tensor with the same shape as ``y_true``.

    Returns:
        Scalar tensor with the mean squared error of the kept entries, or 0
        when every target entry equals 1.0 (the plain mean of an empty
        selection would be NaN and poison training).
    """
    # Build the mask once and reuse it for both tensors.
    keep = y_true != 1.0
    squared_error = tf.square(y_true[keep] - y_pred[keep])

    n_kept = tf.cast(tf.size(squared_error), squared_error.dtype)
    # divide_no_nan returns 0 instead of NaN when nothing was kept.
    return tf.math.divide_no_nan(tf.reduce_sum(squared_error), n_kept)


@tf.function
def attention_mae(y_true, y_pred):
    """Mean absolute error over the target entries that are not exactly 1.0.

    Entries of ``y_true`` equal to 1.0 are excluded from the metric, together
    with the corresponding entries of ``y_pred``. The mask is element-wise:
    each channel value is tested on its own.

    Args:
        y_true: Target tensor.
        y_pred: Prediction tensor with the same shape as ``y_true``.

    Returns:
        Scalar tensor with the mean absolute error of the kept entries, or 0
        when every target entry equals 1.0 (the plain mean of an empty
        selection would be NaN).
    """
    # Build the mask once and reuse it for both tensors.
    keep = y_true != 1.0
    absolute_error = tf.abs(y_true[keep] - y_pred[keep])

    n_kept = tf.cast(tf.size(absolute_error), absolute_error.dtype)
    # divide_no_nan returns 0 instead of NaN when nothing was kept.
    return tf.math.divide_no_nan(tf.reduce_sum(absolute_error), n_kept)


# DataLoader


In [11]:
def load_data_from_dir(path: str) -> tf.data.Dataset:
    """Load every image below ``path`` as a batched, unlabeled dataset.

    Images are read as RGB, resized to ``IMG_SIZE x IMG_SIZE`` with bilinear
    interpolation and grouped into batches of ``BATCH_SIZE``. Shuffling is
    disabled, so separate calls on input and target folders can be zipped
    together -- presumably relying on matching file names in both folders.

    Args:
        path: Directory containing the image files.

    Returns:
        A ``tf.data.Dataset`` yielding image batches only (no labels).
    """
    loader_options = dict(
        labels=None,
        color_mode='rgb',
        batch_size=BATCH_SIZE,
        image_size=(IMG_SIZE, IMG_SIZE),
        shuffle=False,
        seed=42,
        interpolation='bilinear',
        follow_links=False,
        crop_to_aspect_ratio=False,
    )
    return tf.keras.utils.image_dataset_from_directory(path, **loader_options)


# Load Dataset


In [12]:
# Load input and target images of each split in the same (unshuffled) order.
trainX, trainY = (
    load_data_from_dir(os.path.join(DATASET_PATH, TRAIN_DIR, sub_dir))
    for sub_dir in (INPUT_DIR, TARGET_DIR)
)
testX, testY = (
    load_data_from_dir(os.path.join(DATASET_PATH, TEST_DIR, sub_dir))
    for sub_dir in (INPUT_DIR, TARGET_DIR)
)

# Pair each input batch with the target batch at the same position.
train_ds = tf.data.Dataset.zip((trainX, trainY))
test_ds = tf.data.Dataset.zip((testX, testY))

print(train_ds.element_spec, test_ds.element_spec, sep="\n")


Found 2436 files belonging to 1 classes.
Found 2436 files belonging to 1 classes.
Found 612 files belonging to 1 classes.
Found 612 files belonging to 1 classes.
(TensorSpec(shape=(None, 256, 256, 3), dtype=tf.float32, name=None), TensorSpec(shape=(None, 256, 256, 3), dtype=tf.float32, name=None))
(TensorSpec(shape=(None, 256, 256, 3), dtype=tf.float32, name=None), TensorSpec(shape=(None, 256, 256, 3), dtype=tf.float32, name=None))


# Normalization


In [13]:
# Scale pixel values by 1/255.
normalization_layer = tf.keras.layers.Rescaling(1./255)


def _rescale_pair(x, y):
    """Apply the shared rescaling layer to an (input, target) batch pair."""
    return normalization_layer(x), normalization_layer(y)


# NOTE: both datasets are rebound to their rescaled versions, so running
# this cell twice rescales twice.
train_ds = train_ds.map(_rescale_pair)
test_ds = test_ds.map(_rescale_pair)


# Augmentation


In [14]:
class Augment(tf.keras.layers.Layer):
    """Apply a random zoom to an (inputs, labels) pair.

    Two separate ``RandomZoom`` layers are created with the same factor and
    the same seed, with the intent that inputs and labels receive the same
    random changes.

    NOTE(review): this layer is not used in the visible cells; verify that
    the two layers really stay in sync on the installed Keras version.

    Args:
        seed: Seed passed to both ``RandomZoom`` layers.
    """

    def __init__(self, seed=42):
        super().__init__()
        zoom_factor = (-0.1, -0.7)

        def make_zoom():
            # A fresh layer per call, always with the same factor and seed.
            return tf.keras.layers.RandomZoom(zoom_factor, seed=seed)

        self.augment_inputs = make_zoom()
        self.augment_labels = make_zoom()

    def call(self, inputs, labels):
        """Return the augmented ``(inputs, labels)`` tuple."""
        zoomed_inputs = self.augment_inputs(inputs)
        zoomed_labels = self.augment_labels(labels)
        return zoomed_inputs, zoomed_labels


# Optimization


In [15]:
AUTOTUNE = tf.data.AUTOTUNE

# Training pipeline: cache, shuffle, prefetch. The dataset elements are
# already batches (load_data_from_dir batches them), so the shuffle reorders
# whole batches rather than individual images.
train_batches = train_ds.cache().shuffle(BUFFER_SIZE).prefetch(buffer_size=AUTOTUNE)

# Evaluation pipeline: cached and prefetched, order preserved.
test_batches = test_ds.cache().prefetch(buffer_size=AUTOTUNE)


# Training Config


In [16]:
# Checkpoint prefix (weights only); later also used as the folder that
# receives the full saved models.
model_path = os.path.join(MODEL_PATH, EXP_NAME)

callbacks = [
    # Stop after PATIENCE epochs without val_loss improvement and roll back
    # to the best weights seen.
    tf.keras.callbacks.EarlyStopping(
        monitor="val_loss",
        patience=PATIENCE,
        restore_best_weights=True
    ),
    # Persist the weights whenever val_loss improves.
    tf.keras.callbacks.ModelCheckpoint(
        model_path,
        monitor='val_loss',
        verbose=1,
        save_best_only=True,
        save_weights_only=True
    )
]

optimizer = tf.keras.optimizers.Adam(
    learning_rate=LEARNING_RATE
)

model = UNet(IMG_SIZE)()
# model = MultiResUNet(IMG_SIZE, IMG_SIZE, 3)

model.compile(
    loss=attention_mse,
    optimizer=optimizer,
    metrics=[attention_mae]
)

# Resume from an earlier checkpoint when one exists. Loading stays
# best-effort (training starts from scratch on failure), but the reason is
# reported and KeyboardInterrupt / SystemExit are no longer swallowed as they
# were by the bare `except:`.
try:
    model.load_weights(model_path)
except tf.errors.NotFoundError:
    print("Checkpoint not found")
except Exception as err:
    print(f"Checkpoint could not be loaded, training from scratch: {err!r}")


# Training


In [17]:
# `train_batches` / `test_batches` are tf.data datasets that are already
# batched (BATCH_SIZE is applied in load_data_from_dir), so `batch_size` is
# not passed to `fit`: Keras documents that it must not be specified for
# dataset inputs.
# NOTE(review): validation (and therefore early stopping / checkpointing)
# uses the Test/ images -- confirm a separate validation split is not wanted.
history = model.fit(
    train_batches,
    validation_data=test_batches,
    epochs=N_EPOCHS,
    callbacks=callbacks,
    verbose=1
)


Epoch 1/300
Epoch 1: val_loss improved from inf to 0.01571, saving model to /content/drive/MyDrive/Research/TAVI/Models/TAWSS_2_ECAP_MultiViewUNet_I256_B16_LR0.001
Epoch 2/300
Epoch 2: val_loss improved from 0.01571 to 0.01535, saving model to /content/drive/MyDrive/Research/TAVI/Models/TAWSS_2_ECAP_MultiViewUNet_I256_B16_LR0.001
Epoch 3/300
Epoch 3: val_loss improved from 0.01535 to 0.01518, saving model to /content/drive/MyDrive/Research/TAVI/Models/TAWSS_2_ECAP_MultiViewUNet_I256_B16_LR0.001
Epoch 4/300
Epoch 4: val_loss improved from 0.01518 to 0.01473, saving model to /content/drive/MyDrive/Research/TAVI/Models/TAWSS_2_ECAP_MultiViewUNet_I256_B16_LR0.001
Epoch 5/300
Epoch 5: val_loss did not improve from 0.01473
Epoch 6/300
Epoch 6: val_loss improved from 0.01473 to 0.01471, saving model to /content/drive/MyDrive/Research/TAVI/Models/TAWSS_2_ECAP_MultiViewUNet_I256_B16_LR0.001
Epoch 7/300
Epoch 7: val_loss did not improve from 0.01471
Epoch 8/300
Epoch 8: val_loss did not improve 

# Save Model


In [18]:
# Run identifier, e.g. "Jun-20-12:36PM" (month-day-hour:minute, 12-hour
# clock, no year); also reused for the predictions folder.
timestamp = datetime.datetime.now().strftime('%b-%d-%I:%M%p')

# exist_ok avoids the check-then-create race of a separate os.path.exists().
os.makedirs(model_path, exist_ok=True)

# Save the full model (not just the weights) in a per-run sub-folder.
model.save(os.path.join(model_path, timestamp))




In [19]:
# Display the path the full model was saved to in the previous cell.
os.path.join(model_path, timestamp)

'/content/drive/MyDrive/Research/TAVI/Models/TAWSS_2_ECAP_MultiViewUNet_I256_B16_LR0.001/Jun-20-12:36PM'

# Save Predictions


In [20]:
def _save_image(image, path):
    """Render `image` on a 7x7-inch figure without axes and write it to `path`."""
    plt.figure(figsize=(7, 7))
    plt.imshow(image)
    plt.axis("off")
    plt.tight_layout()
    plt.savefig(path)
    plt.close()  # release the figure; hundreds are created in the loop


# Iterate over single (input, target) images instead of batches.
test_ds_unbatched = test_batches.unbatch()

pred_path = os.path.join(PRED_PATH, EXP_NAME, timestamp)
os.makedirs(pred_path, exist_ok=True)

# Not filled in by this cell; kept because later cells may rely on it.
metrics = pd.DataFrame()

# `input_img` rather than `input`, so the builtin is not shadowed.
for idx, (input_img, target) in enumerate(tqdm(test_ds_unbatched)):

    target = tf.squeeze(target).numpy()

    # Single-image inference: call the model directly, as the Keras docs
    # recommend for inputs that fit in one batch. training=False keeps
    # dropout and batch normalization in inference mode, and no per-image
    # progress bar is printed.
    prediction = tf.squeeze(
        model(tf.expand_dims(input_img, axis=0), training=False)
    )

    # Pixels whose three target channels sum to 3.0 (pure white background)
    # are painted white in the prediction as well. The (H, W, 1) mask
    # broadcasts over the channel axis in tf.where.
    white_mask = tf.equal(
        tf.reduce_sum(target, axis=-1, keepdims=True), 3.0
    )
    prediction = tf.where(white_mask, tf.ones_like(prediction), prediction)

    _save_image(target, os.path.join(pred_path, f"{idx}_T.png"))
    _save_image(prediction, os.path.join(pred_path, f"{idx}_P.png"))


0it [00:00, ?it/s]



1it [00:02,  2.32s/it]



2it [00:02,  1.21s/it]



3it [00:03,  1.17it/s]



4it [00:03,  1.44it/s]



5it [00:04,  1.66it/s]



6it [00:04,  1.83it/s]



7it [00:04,  1.96it/s]



8it [00:05,  2.09it/s]



9it [00:05,  2.14it/s]



10it [00:06,  2.17it/s]



11it [00:06,  2.27it/s]



12it [00:07,  2.27it/s]



13it [00:07,  2.24it/s]



14it [00:07,  2.25it/s]



15it [00:08,  2.22it/s]



16it [00:08,  2.15it/s]



17it [00:09,  2.12it/s]



18it [00:09,  2.19it/s]



19it [00:10,  2.37it/s]



20it [00:10,  2.41it/s]



21it [00:10,  2.56it/s]



22it [00:11,  2.64it/s]



23it [00:11,  2.56it/s]



24it [00:12,  2.48it/s]



25it [00:12,  2.43it/s]



26it [00:12,  2.54it/s]



27it [00:13,  2.48it/s]



28it [00:13,  2.40it/s]



29it [00:14,  2.42it/s]



30it [00:14,  2.37it/s]



31it [00:15,  2.34it/s]



32it [00:15,  2.31it/s]



33it [00:15,  2.30it/s]



34it [00:16,  2.32it/s]



35it [00:16,  2.29it/s]



36it [00:17,  2.26it/s]



37it [00:17,  2.32it/s]



38it [00:18,  2.46it/s]



39it [00:18,  2.40it/s]



40it [00:18,  2.38it/s]



41it [00:19,  2.35it/s]



42it [00:19,  2.34it/s]



43it [00:20,  2.43it/s]



44it [00:20,  2.39it/s]



45it [00:21,  2.37it/s]



46it [00:21,  2.34it/s]



47it [00:21,  2.30it/s]



48it [00:22,  2.44it/s]



49it [00:22,  2.54it/s]



50it [00:23,  2.43it/s]



51it [00:23,  2.37it/s]



52it [00:23,  2.34it/s]



53it [00:24,  2.32it/s]



54it [00:24,  2.45it/s]



55it [00:25,  2.55it/s]



56it [00:25,  2.63it/s]



57it [00:25,  2.47it/s]



58it [00:26,  2.57it/s]



59it [00:26,  2.63it/s]



60it [00:26,  2.69it/s]



61it [00:27,  2.55it/s]



62it [00:27,  2.48it/s]



63it [00:28,  2.40it/s]



64it [00:28,  2.34it/s]



65it [00:29,  2.31it/s]



66it [00:29,  2.30it/s]



67it [00:30,  2.28it/s]



68it [00:30,  2.27it/s]



69it [00:30,  2.34it/s]



70it [00:31,  1.76it/s]



71it [00:32,  1.90it/s]



72it [00:32,  2.01it/s]



73it [00:33,  2.19it/s]



74it [00:33,  2.33it/s]



75it [00:33,  2.28it/s]



76it [00:34,  2.27it/s]



77it [00:34,  2.26it/s]



78it [00:35,  2.26it/s]



79it [00:35,  2.25it/s]



80it [00:36,  2.21it/s]



81it [00:36,  2.22it/s]



82it [00:37,  2.23it/s]



83it [00:37,  2.24it/s]



84it [00:37,  2.30it/s]



85it [00:38,  2.29it/s]



86it [00:38,  2.33it/s]



87it [00:39,  2.37it/s]



88it [00:39,  2.35it/s]



89it [00:39,  2.46it/s]



90it [00:40,  2.56it/s]



91it [00:40,  2.55it/s]



92it [00:41,  2.34it/s]



93it [00:41,  2.29it/s]



94it [00:42,  2.27it/s]



95it [00:42,  2.20it/s]



96it [00:43,  2.19it/s]



97it [00:43,  2.23it/s]



98it [00:43,  2.21it/s]



99it [00:44,  2.23it/s]



100it [00:44,  2.24it/s]



101it [00:45,  2.33it/s]



102it [00:45,  2.31it/s]



103it [00:46,  2.30it/s]



104it [00:46,  2.46it/s]



105it [00:46,  2.57it/s]



106it [00:47,  2.62it/s]



107it [00:47,  2.54it/s]



108it [00:47,  2.48it/s]



109it [00:48,  2.47it/s]



110it [00:48,  2.47it/s]



111it [00:49,  2.53it/s]



112it [00:49,  2.43it/s]



113it [00:49,  2.52it/s]



114it [00:50,  2.47it/s]



115it [00:50,  2.40it/s]



116it [00:51,  2.41it/s]



117it [00:51,  2.44it/s]



118it [00:52,  2.38it/s]



119it [00:52,  2.34it/s]



120it [00:52,  2.48it/s]



121it [00:53,  2.42it/s]



122it [00:53,  2.39it/s]



123it [00:54,  2.32it/s]



124it [00:54,  2.30it/s]



125it [00:55,  2.20it/s]



126it [00:55,  2.21it/s]



127it [00:56,  2.16it/s]



128it [00:56,  2.20it/s]



129it [00:56,  2.22it/s]



130it [00:57,  2.30it/s]



131it [00:57,  2.37it/s]



132it [00:58,  2.34it/s]



133it [00:58,  2.32it/s]



134it [00:59,  2.31it/s]



135it [00:59,  2.30it/s]



136it [00:59,  2.29it/s]



137it [01:00,  2.29it/s]



138it [01:00,  2.29it/s]



139it [01:01,  2.29it/s]



140it [01:01,  2.29it/s]



141it [01:02,  2.28it/s]



142it [01:02,  2.26it/s]



143it [01:03,  2.26it/s]



144it [01:03,  2.23it/s]



145it [01:03,  2.25it/s]



146it [01:04,  2.25it/s]



147it [01:04,  2.24it/s]



148it [01:05,  2.24it/s]



149it [01:05,  2.25it/s]



150it [01:06,  2.24it/s]



151it [01:06,  2.25it/s]



152it [01:07,  2.24it/s]



153it [01:07,  2.23it/s]



154it [01:07,  2.24it/s]



155it [01:08,  2.23it/s]



156it [01:08,  2.21it/s]



157it [01:09,  2.17it/s]



158it [01:09,  2.10it/s]



159it [01:10,  2.13it/s]



160it [01:10,  2.25it/s]



161it [01:11,  2.26it/s]



162it [01:11,  2.27it/s]



163it [01:12,  2.27it/s]



164it [01:12,  2.42it/s]



165it [01:12,  2.48it/s]



166it [01:13,  2.43it/s]



167it [01:13,  2.39it/s]



168it [01:14,  2.36it/s]



169it [01:14,  2.46it/s]



170it [01:14,  2.49it/s]



171it [01:15,  2.56it/s]



172it [01:15,  2.44it/s]



173it [01:15,  2.55it/s]



174it [01:16,  2.09it/s]



175it [01:17,  2.26it/s]



176it [01:17,  2.42it/s]



177it [01:17,  2.42it/s]



178it [01:18,  2.53it/s]



179it [01:18,  2.63it/s]



180it [01:18,  2.51it/s]



181it [01:19,  2.43it/s]



182it [01:19,  2.38it/s]



183it [01:20,  2.31it/s]



184it [01:20,  2.27it/s]



185it [01:21,  2.27it/s]



186it [01:21,  2.17it/s]



187it [01:22,  2.11it/s]



188it [01:22,  2.14it/s]



189it [01:23,  2.11it/s]



190it [01:23,  2.13it/s]



191it [01:23,  2.27it/s]



192it [01:24,  2.28it/s]



193it [01:24,  2.27it/s]



194it [01:25,  2.42it/s]



195it [01:25,  2.37it/s]



196it [01:25,  2.43it/s]



197it [01:26,  2.37it/s]



198it [01:26,  2.33it/s]



199it [01:27,  2.32it/s]



200it [01:27,  2.31it/s]



201it [01:28,  2.30it/s]



202it [01:28,  2.30it/s]



203it [01:29,  2.29it/s]



204it [01:29,  2.28it/s]



205it [01:29,  2.31it/s]



206it [01:30,  2.46it/s]



207it [01:30,  2.54it/s]



208it [01:31,  2.49it/s]



209it [01:31,  2.42it/s]



210it [01:31,  2.52it/s]



211it [01:32,  2.62it/s]



212it [01:32,  2.48it/s]



213it [01:33,  2.47it/s]



214it [01:33,  2.41it/s]



215it [01:33,  2.32it/s]



216it [01:34,  2.30it/s]



217it [01:34,  2.26it/s]



218it [01:35,  2.24it/s]



219it [01:35,  2.17it/s]



220it [01:36,  2.19it/s]



221it [01:36,  2.19it/s]



222it [01:37,  2.22it/s]



223it [01:37,  2.36it/s]



224it [01:37,  2.38it/s]



225it [01:38,  2.36it/s]



226it [01:38,  2.36it/s]



227it [01:39,  2.33it/s]



228it [01:39,  2.27it/s]



229it [01:40,  2.26it/s]



230it [01:40,  2.26it/s]



231it [01:40,  2.41it/s]



232it [01:41,  2.53it/s]



233it [01:41,  2.60it/s]



234it [01:42,  2.66it/s]



235it [01:42,  2.62it/s]



236it [01:42,  2.69it/s]



237it [01:43,  2.59it/s]



238it [01:43,  2.50it/s]



239it [01:43,  2.62it/s]



240it [01:44,  2.46it/s]



241it [01:44,  2.51it/s]



242it [01:45,  2.60it/s]



243it [01:45,  2.69it/s]



244it [01:45,  2.56it/s]



245it [01:46,  2.59it/s]



246it [01:46,  2.70it/s]



247it [01:47,  2.46it/s]



248it [01:47,  2.40it/s]



249it [01:47,  2.37it/s]



250it [01:48,  2.32it/s]



251it [01:48,  2.31it/s]



252it [01:49,  2.22it/s]



253it [01:49,  2.22it/s]



254it [01:50,  2.25it/s]



255it [01:50,  2.27it/s]



256it [01:51,  2.27it/s]



257it [01:51,  2.41it/s]



258it [01:51,  2.52it/s]



259it [01:52,  2.44it/s]



260it [01:52,  2.39it/s]



261it [01:53,  2.54it/s]



262it [01:53,  2.58it/s]



263it [01:53,  2.50it/s]



264it [01:54,  2.46it/s]



265it [01:54,  2.39it/s]



266it [01:55,  2.37it/s]



267it [01:55,  2.30it/s]



268it [01:56,  2.28it/s]



269it [01:56,  2.26it/s]



270it [01:56,  2.26it/s]



271it [01:57,  2.40it/s]



272it [01:57,  2.35it/s]



273it [01:58,  2.51it/s]



274it [01:58,  2.57it/s]



275it [01:58,  2.58it/s]



276it [01:59,  2.70it/s]



277it [01:59,  2.58it/s]



278it [02:00,  2.02it/s]



279it [02:00,  2.04it/s]



280it [02:01,  2.07it/s]



281it [02:01,  2.12it/s]



282it [02:02,  2.15it/s]



283it [02:02,  2.18it/s]



284it [02:03,  2.19it/s]



285it [02:03,  2.20it/s]



286it [02:03,  2.22it/s]



287it [02:04,  2.39it/s]



288it [02:04,  2.42it/s]



289it [02:05,  2.37it/s]



290it [02:05,  2.35it/s]



291it [02:06,  2.33it/s]



292it [02:06,  2.31it/s]



293it [02:06,  2.30it/s]



294it [02:07,  2.29it/s]



295it [02:07,  2.27it/s]



296it [02:08,  2.24it/s]



297it [02:08,  2.25it/s]



298it [02:09,  2.26it/s]



299it [02:09,  2.28it/s]



300it [02:10,  2.24it/s]



301it [02:10,  2.23it/s]



302it [02:10,  2.25it/s]



303it [02:11,  2.26it/s]



304it [02:11,  2.36it/s]



305it [02:12,  2.49it/s]



306it [02:12,  2.55it/s]



307it [02:12,  2.52it/s]



308it [02:13,  2.36it/s]



309it [02:13,  2.28it/s]



310it [02:14,  2.27it/s]



311it [02:14,  2.21it/s]



312it [02:15,  2.21it/s]



313it [02:15,  2.19it/s]



314it [02:16,  2.29it/s]



315it [02:16,  2.29it/s]



316it [02:16,  2.33it/s]



317it [02:17,  2.45it/s]



318it [02:17,  2.53it/s]



319it [02:18,  2.55it/s]



320it [02:18,  2.62it/s]



321it [02:18,  2.70it/s]



322it [02:19,  2.75it/s]



323it [02:19,  2.59it/s]



324it [02:19,  2.49it/s]



325it [02:20,  2.58it/s]



326it [02:20,  2.65it/s]



327it [02:21,  2.54it/s]



328it [02:21,  2.44it/s]



329it [02:21,  2.51it/s]



330it [02:22,  2.43it/s]



331it [02:22,  2.38it/s]



332it [02:23,  2.35it/s]



333it [02:23,  2.34it/s]



334it [02:24,  2.33it/s]



335it [02:24,  2.32it/s]



336it [02:24,  2.32it/s]



337it [02:25,  2.32it/s]



338it [02:25,  2.32it/s]



339it [02:26,  2.28it/s]



340it [02:26,  2.27it/s]



341it [02:27,  2.26it/s]



342it [02:27,  2.25it/s]



343it [02:28,  2.22it/s]



344it [02:28,  2.22it/s]



345it [02:28,  2.22it/s]



346it [02:29,  2.24it/s]



347it [02:29,  2.25it/s]



348it [02:30,  2.25it/s]



349it [02:30,  2.26it/s]



350it [02:31,  2.26it/s]



351it [02:31,  2.25it/s]



352it [02:32,  2.37it/s]



353it [02:32,  2.50it/s]



354it [02:32,  2.42it/s]



355it [02:33,  2.37it/s]



356it [02:33,  2.42it/s]



357it [02:33,  2.51it/s]



358it [02:34,  2.41it/s]



359it [02:34,  2.37it/s]



360it [02:35,  2.39it/s]



361it [02:35,  2.36it/s]



362it [02:36,  2.33it/s]



363it [02:36,  2.43it/s]



364it [02:36,  2.38it/s]



365it [02:37,  2.36it/s]



366it [02:37,  2.31it/s]



367it [02:38,  2.32it/s]



368it [02:38,  2.38it/s]



369it [02:39,  2.30it/s]



370it [02:39,  2.29it/s]



371it [02:40,  2.28it/s]



372it [02:40,  2.18it/s]



373it [02:41,  2.19it/s]



374it [02:41,  2.12it/s]



375it [02:41,  2.13it/s]



376it [02:42,  2.17it/s]



377it [02:42,  2.19it/s]



378it [02:43,  2.21it/s]



379it [02:43,  2.23it/s]



380it [02:44,  2.25it/s]



381it [02:44,  2.26it/s]



382it [02:45,  2.27it/s]



383it [02:45,  2.31it/s]



384it [02:45,  2.29it/s]



385it [02:46,  2.01it/s]



386it [02:46,  2.21it/s]



387it [02:47,  2.23it/s]



388it [02:47,  2.39it/s]



389it [02:48,  2.50it/s]



390it [02:48,  2.44it/s]



391it [02:48,  2.56it/s]



392it [02:49,  2.59it/s]



393it [02:49,  2.56it/s]



394it [02:49,  2.67it/s]



395it [02:50,  2.77it/s]



396it [02:50,  2.68it/s]



397it [02:51,  2.56it/s]



398it [02:51,  2.47it/s]



399it [02:51,  2.42it/s]



400it [02:52,  2.33it/s]



401it [02:52,  2.24it/s]



402it [02:53,  2.20it/s]



403it [02:53,  2.21it/s]



404it [02:54,  2.22it/s]



405it [02:54,  2.22it/s]



406it [02:55,  2.13it/s]



407it [02:55,  2.12it/s]



408it [02:56,  2.17it/s]



409it [02:56,  2.37it/s]



410it [02:56,  2.34it/s]



411it [02:57,  2.50it/s]



412it [02:57,  2.57it/s]



413it [02:57,  2.67it/s]



414it [02:58,  2.65it/s]



415it [02:58,  2.49it/s]



416it [02:59,  2.41it/s]



417it [02:59,  2.36it/s]



418it [03:00,  2.33it/s]



419it [03:00,  2.46it/s]



420it [03:00,  2.41it/s]



421it [03:01,  2.38it/s]



422it [03:01,  2.36it/s]



423it [03:02,  2.50it/s]



424it [03:02,  2.57it/s]



425it [03:02,  2.55it/s]



426it [03:03,  2.44it/s]



427it [03:03,  2.52it/s]



428it [03:04,  2.55it/s]



429it [03:04,  2.46it/s]



430it [03:04,  2.41it/s]



431it [03:05,  2.45it/s]



432it [03:05,  2.29it/s]



433it [03:06,  2.29it/s]



434it [03:06,  2.26it/s]



435it [03:07,  2.25it/s]



436it [03:07,  2.23it/s]



437it [03:08,  2.23it/s]



438it [03:08,  2.22it/s]



439it [03:08,  2.35it/s]



440it [03:09,  2.49it/s]



441it [03:09,  2.61it/s]



442it [03:10,  2.49it/s]



443it [03:10,  2.63it/s]



444it [03:10,  2.49it/s]



445it [03:11,  2.46it/s]



446it [03:11,  2.60it/s]



447it [03:12,  2.59it/s]



448it [03:12,  2.51it/s]



449it [03:12,  2.60it/s]



450it [03:13,  2.55it/s]



451it [03:13,  2.66it/s]



452it [03:13,  2.51it/s]



453it [03:14,  2.45it/s]



454it [03:14,  2.39it/s]



455it [03:15,  2.43it/s]



456it [03:15,  2.52it/s]



457it [03:15,  2.55it/s]



458it [03:16,  2.47it/s]



459it [03:16,  2.41it/s]



460it [03:17,  2.36it/s]



461it [03:17,  2.34it/s]



462it [03:18,  2.44it/s]



463it [03:18,  2.39it/s]



464it [03:19,  2.33it/s]



465it [03:19,  2.29it/s]



466it [03:19,  2.29it/s]



467it [03:20,  2.29it/s]



468it [03:20,  2.26it/s]



469it [03:21,  2.25it/s]



470it [03:21,  2.24it/s]



471it [03:22,  2.25it/s]



472it [03:22,  2.26it/s]



473it [03:23,  2.27it/s]



474it [03:23,  2.43it/s]



475it [03:23,  2.58it/s]



476it [03:24,  2.69it/s]



477it [03:24,  2.55it/s]



478it [03:24,  2.47it/s]



479it [03:25,  2.48it/s]



480it [03:25,  2.60it/s]



481it [03:25,  2.63it/s]



482it [03:26,  2.52it/s]



483it [03:26,  2.45it/s]



484it [03:27,  2.40it/s]



485it [03:27,  2.36it/s]



486it [03:28,  2.41it/s]



487it [03:28,  2.37it/s]



488it [03:29,  2.33it/s]



489it [03:29,  2.29it/s]



490it [03:30,  1.88it/s]



491it [03:30,  1.97it/s]



492it [03:31,  2.13it/s]



493it [03:31,  2.17it/s]



494it [03:31,  2.18it/s]



495it [03:32,  2.18it/s]



496it [03:32,  2.17it/s]



497it [03:33,  2.12it/s]



498it [03:33,  2.10it/s]



499it [03:34,  2.11it/s]



500it [03:34,  2.15it/s]



501it [03:35,  2.23it/s]



502it [03:35,  2.37it/s]



503it [03:35,  2.50it/s]



504it [03:36,  2.44it/s]



505it [03:36,  2.38it/s]



506it [03:37,  2.32it/s]



507it [03:37,  2.49it/s]



508it [03:37,  2.58it/s]



509it [03:38,  2.48it/s]



510it [03:38,  2.40it/s]



511it [03:39,  2.52it/s]



512it [03:39,  2.52it/s]



513it [03:39,  2.44it/s]



514it [03:40,  2.54it/s]



515it [03:40,  2.46it/s]



516it [03:41,  2.39it/s]



517it [03:41,  2.33it/s]



518it [03:42,  2.31it/s]



519it [03:42,  2.46it/s]



520it [03:42,  2.40it/s]



521it [03:43,  2.36it/s]



522it [03:43,  2.49it/s]



523it [03:44,  2.41it/s]



524it [03:44,  2.53it/s]



525it [03:44,  2.64it/s]



526it [03:45,  2.46it/s]



527it [03:45,  2.40it/s]



528it [03:46,  2.34it/s]



529it [03:46,  2.32it/s]



530it [03:47,  2.20it/s]



531it [03:47,  2.21it/s]



532it [03:48,  2.21it/s]



533it [03:48,  2.22it/s]



534it [03:48,  2.24it/s]



535it [03:49,  2.26it/s]



536it [03:49,  2.27it/s]



537it [03:50,  2.44it/s]



538it [03:50,  2.38it/s]



539it [03:50,  2.55it/s]



540it [03:51,  2.66it/s]



541it [03:51,  2.68it/s]



542it [03:51,  2.74it/s]



543it [03:52,  2.61it/s]



544it [03:52,  2.62it/s]



545it [03:53,  2.49it/s]



546it [03:53,  2.43it/s]



547it [03:54,  2.40it/s]



548it [03:54,  2.36it/s]



549it [03:54,  2.34it/s]



550it [03:55,  2.48it/s]



551it [03:55,  2.61it/s]



552it [03:56,  2.50it/s]



553it [03:56,  2.50it/s]



554it [03:56,  2.60it/s]



555it [03:57,  2.49it/s]



556it [03:57,  2.43it/s]



557it [03:58,  2.38it/s]



558it [03:58,  2.33it/s]



559it [03:59,  2.30it/s]



560it [03:59,  2.26it/s]



561it [03:59,  2.21it/s]



562it [04:00,  2.14it/s]



563it [04:00,  2.10it/s]



564it [04:01,  2.10it/s]



565it [04:01,  2.13it/s]



566it [04:02,  2.17it/s]



567it [04:02,  2.24it/s]



568it [04:03,  2.25it/s]



569it [04:03,  2.23it/s]



570it [04:04,  2.35it/s]



571it [04:04,  2.49it/s]



572it [04:04,  2.41it/s]



573it [04:05,  2.36it/s]



574it [04:05,  2.34it/s]



575it [04:06,  2.32it/s]



576it [04:06,  2.33it/s]



577it [04:06,  2.35it/s]



578it [04:07,  2.45it/s]



579it [04:07,  2.57it/s]



580it [04:08,  2.51it/s]



581it [04:08,  2.44it/s]



582it [04:08,  2.51it/s]



583it [04:09,  2.42it/s]



584it [04:09,  2.38it/s]



585it [04:10,  2.32it/s]



586it [04:10,  2.47it/s]



587it [04:11,  2.49it/s]



588it [04:11,  2.45it/s]



589it [04:11,  2.34it/s]



590it [04:12,  2.31it/s]



591it [04:13,  1.87it/s]



592it [04:13,  1.95it/s]



593it [04:14,  1.95it/s]



594it [04:14,  2.02it/s]



595it [04:15,  2.07it/s]



596it [04:15,  2.23it/s]



597it [04:15,  2.36it/s]



598it [04:16,  2.30it/s]



599it [04:16,  2.27it/s]



600it [04:17,  2.27it/s]



601it [04:17,  2.42it/s]



602it [04:17,  2.46it/s]



603it [04:18,  2.42it/s]



604it [04:18,  2.58it/s]



605it [04:19,  2.47it/s]



606it [04:19,  2.39it/s]



607it [04:19,  2.39it/s]



608it [04:20,  2.36it/s]



609it [04:20,  2.34it/s]



610it [04:21,  2.31it/s]



611it [04:21,  2.28it/s]



612it [05:21,  1.90it/s]


# Loss Curve


In [21]:
# Plot the per-epoch training and validation loss and save the figure as
# <model_path>/<timestamp>.png. Nothing is displayed inline; the figure is
# closed after saving.
try:
    # Only the lookup of the recorded losses is treated as "training did not
    # finish": `history` may be undefined, lack `.history`, or lack a key.
    # NOTE(review): presumably `history` is assigned by the training cell — confirm.
    loss = history.history['loss']
    val_loss = history.history['val_loss']
except (NameError, AttributeError, KeyError):
    print("Model did not finish training")
else:
    fig, ax = plt.subplots(figsize=(8, 6))
    try:
        ax.plot(loss, label='Training Loss')
        ax.plot(val_loss, label='Validation Loss')
        ax.legend(loc='upper right')
        ax.set_ylabel('Attention MAE')
        ax.set_title('Training and Validation Loss')
        ax.set_xlabel('Epoch')
        fig.tight_layout()
        fig.savefig(os.path.join(model_path, timestamp + ".png"))
    except OSError as err:
        # A failed write (missing directory, permissions, full disk) is reported
        # as what it is instead of being mislabelled as an unfinished training run.
        print(f"Could not save loss curve: {err}")
    finally:
        # Always release the figure, even if plotting or saving raised.
        plt.close(fig)


# Metrics


In [22]:
# Evaluate the model on `test_batches`; the value returned by `evaluate` is the
# last expression of the cell and is therefore shown as the cell output.
# NOTE(review): the output is a two-element list — presumably [loss, metric] as
# configured in `model.compile`; confirm against the compile cell.
model.evaluate(test_batches)




[0.013964442536234856, 0.05754619464278221]