In [1]:
import os
import pandas as pd
import numpy as np
from sklearn.preprocessing import LabelEncoder
from sklearn.model_selection import train_test_split
from sklearn.metrics import classification_report, confusion_matrix
import matplotlib.pyplot as plt

import torch
from torch import nn, optim
from torch.nn import functional as F
from torch.utils.data import Dataset, DataLoader

import torchmetrics
from torchmetrics.functional import accuracy

import pytorch_lightning as pl
from pytorch_lightning.loggers import TensorBoardLogger
from pytorch_lightning.callbacks import ModelCheckpoint

device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
print(device)

  from .autonotebook import tqdm as notebook_tqdm


cuda


## Model Setup 

In [2]:
pl.seed_everything(42, workers=True)

class DrowsyDataset(Dataset):
    
    def __init__(self, sequences):
        self.sequences = sequences
        
    def __len__(self):
        return len(self.sequences)
    
    def __getitem__(self, idx):
        sequence, label = self.sequences[idx]
        return dict(
            sequence=torch.Tensor(sequence.to_numpy()),
            label=torch.tensor(label).long()
        )
    
class DrowsyDataModule(pl.LightningDataModule):
    
    def __init__(self, train_sequences, val_sequences, test_sequences, batch_size):
        super().__init__()
        self.train_sequences = train_sequences
        self.val_sequences = val_sequences
        self.test_sequences = test_sequences
        self.batch_size = batch_size

    def setup(self, stage=None):
        self.train_dataset = DrowsyDataset(self.train_sequences)
        self.val_dataset = DrowsyDataset(self.val_sequences)
        self.test_dataset = DrowsyDataset(self.test_sequences)
        
    def train_dataloader(self):
        return DataLoader(
            self.train_dataset,
            batch_size=self.batch_size,
            shuffle=True,
            num_workers=os.cpu_count()
        )
    
    def val_dataloader(self):
        return DataLoader(
            self.val_dataset,
            batch_size=self.batch_size,
            shuffle=False,
            num_workers=os.cpu_count()
        )
    
    def test_dataloader(self):
        return DataLoader(
            self.test_dataset,
            batch_size=self.batch_size,
            shuffle=False,
            num_workers=os.cpu_count()
        ) 

class DrowsyModel(nn.Module):
    
    def __init__(self, n_features, n_classes, n_hidden=256, n_layers=3):
        super().__init__()
        
        self.n_hidden = n_hidden
        
        self.lstm = nn.LSTM(
            input_size=n_features,
            hidden_size=n_hidden,
            num_layers=n_layers,
            batch_first=True,
            dropout=0.75
        )
        
        self.classifier = nn.Linear(n_hidden, n_classes)
        
    def forward(self, x):
        self.lstm.flatten_parameters()
        _, (hidden, _) = self.lstm(x)
        
        out = hidden[-1]
        return self.classifier(out)
    
class DrowsyPredictor(pl.LightningModule):
    
    def __init__(self, n_features: int, n_classes: int):
        super().__init__()
        self.model = DrowsyModel(n_features, n_classes)
        self.criterion = nn.CrossEntropyLoss()
        
    def forward(self, x, label=None):
        output = self.model(x)
        loss = 0
        if label is not None:
            loss = self.criterion(output, label)
        return loss, output
        
    def training_step(self, batch, batch_idx):
        sequences = batch["sequence"]
        labels = batch["label"]
        loss, outputs = self(sequences, labels)
        predictions = torch.argmax(outputs, dim=1)
        step_accuracy = accuracy(predictions, labels)
        
        self.log("train_loss", loss, prog_bar=True, logger=True)
        self.log("train_accuracy", step_accuracy, prog_bar=True, logger=True)
        
        return {"loss": loss, "accuracy": step_accuracy}
    
    def validation_step(self, batch, batch_idx):
        sequences = batch["sequence"]
        labels = batch["label"]
        loss, outputs = self(sequences, labels)
        predictions = torch.argmax(outputs, dim=1)
        step_accuracy = accuracy(predictions, labels)
        
        self.log("val_loss", loss, prog_bar=True, logger=True)
        self.log("val_accuracy", step_accuracy, prog_bar=True, logger=True)
        
        return {"loss": loss, "accuracy": step_accuracy}
    
    def test_step(self, batch, batch_idx):
        sequences = batch["sequence"]
        labels = batch["label"]
        loss, outputs = self(sequences, labels)
        predictions = torch.argmax(outputs, dim=1)
        step_accuracy = accuracy(predictions, labels)
        
        self.log("test_loss", loss, prog_bar=True, logger=True)
        self.log("test_accuracy", step_accuracy, prog_bar=True, logger=True)
        
        return {"loss": loss, "accuracy": step_accuracy}
    
    def configure_optimizers(self):
        return optim.Adam(self.parameters(), lr=0.0001)

Global seed set to 42


## 參數設置

In [3]:
%load_ext tensorboard
%reload_ext tensorboard
%tensorboard --logdir ./lightning_logs --host 0.0.0.0 --port=8888

ERROR: Failed to launch TensorBoard (exited with -6).
Contents of stderr:
2022-03-08 08:41:33.916283: I tensorflow/stream_executor/platform/default/dso_loader.cc:48] Successfully opened dynamic library libcudart.so.10.1
E0308 08:42:11.963188 140516159272768 program.py:312] TensorBoard could not bind to port 8888, it was already in use
ERROR: TensorBoard could not bind to port 8888, it was already in use
terminate called without an active exception
Fatal Python error: Aborted

Current thread 0x00007fcc006cc700 (most recent call first):
  File "/usr/local/lib/python3.6/dist-packages/tensorflow/python/lib/io/file_io.py", line 700 in list_directory_v2
  File "/usr/local/lib/python3.6/dist-packages/tensorboard/backend/event_processing/io_wrapper.py", line 89 in ListDirectoryAbsolute
  File "/usr/local/lib/python3.6/dist-packages/tensorboard/backend/event_processing/directory_watcher.py", line 212 in _GetNextPath
  File "/usr/local/lib/python3.6/dist-packages/tensorboard/backend/event_proces

In [4]:
X_train = pd.read_csv('../data2.csv')

In [5]:
N_EPOCHS = 200
BATCH_SIZE = 50

# randomed 
ORG_FEATURE_COLUMNS = ['HEOR', 'T5', 'VEOL', 'VEOU', 'F8', 'FZ', 'F7', 'TP8', 'FC3', 'T4', 'HEOL', 'FT10', 'O2', 'FC4', 'FCZ', 'CP3', 'FP2', 'TP7', 'C3', 'F3', 'PZ', 'F4', 'O1', 'FT7', 'CP4', 'FP1', 'C4', 'T6', 'FT8', 'CZ', 'PO1', 'OZ', 'A2', 'A1', 'T3', 'P4', 'P3', 'FT9', 'CPZ', 'PO2']
# ['HEOR', 'T5', 'VEOL', 'VEOU', 'F8', 'FZ', 'F7', 'TP8', 'FC3', 'T4', 'HEOL', 'FT10', 'O2', 'FC4', 'FCZ', 'CP3', 'FP2', 'TP7', 'C3', 'F3', 'PZ', 'F4', 'O1', 'FT7', 'CP4', 'FP1', 'C4', 'T6', 'FT8', 'CZ', 'PO1', 'OZ', 'A2', 'A1', 'T3', 'P4', 'P3', 'FT9', 'CPZ', 'PO2']
g = X_train.groupby("group")

In [6]:
# import random
# ORG_FEATURE_COLUMNS = ['TP8', 'FP2', 'FCZ', 'FT10', 'O2', 'O1', 'FT7', 'F4', 'TP7', 'C3', 'C4', 'F3', 'FT8', 'T6', 'HEOR', 'T5', 'VEOL', 'F7', 'FZ', 'VEOU', 'A1', 'P3', 'PZ', 'CP3', 'P4', 'CPZ', 'A2', 'HEOL', 'CP4', 'FT9', 'F8', 'OZ', 'CZ', 'FC4', 'FC3', 'FP1', 'PO1', 'T3', 'T4', 'PO2']
# random.shuffle(ORG_FEATURE_COLUMNS)
# print(ORG_FEATURE_COLUMNS)

## Main

In [None]:
n = 18
FEATURE_COLUMNS = ORG_FEATURE_COLUMNS[n:]

while(n < 20):
    print("------------------ Round: " + str(n) + " ------------------")
    print(FEATURE_COLUMNS)
    print("Len:", len(FEATURE_COLUMNS))
    
    label_encoder = LabelEncoder()
    encoded_labels = label_encoder.fit_transform(X_train.state)

    label_encoder.classes_

    X_train['label'] = encoded_labels

    # Prepare data ###########################################
    sequences = [] 

    for name, group in g:
        sequence_features = group[FEATURE_COLUMNS]
        label = group.label.iloc[0]

        # print((sequence_features, label))
        sequences.append((sequence_features, label))

    # Setting up train, test, val gruop #######################
    train_sequences, test_sequences = train_test_split(sequences, test_size=0.2)
    val_sequences, test_sequences = train_test_split(test_sequences, test_size=0.5)


    # Setting up data module ##################################
    data_module = DrowsyDataModule(
        train_sequences, val_sequences, test_sequences, BATCH_SIZE
    )

    model = DrowsyPredictor(
        n_features=len(FEATURE_COLUMNS), 
        n_classes=len(label_encoder.classes_)
    )

    # Check points and logger #################################
    checkpoint_callback = ModelCheckpoint(
        dirpath="checkpoints",
        filename="best-checkpoint-corr-mi-" + str(n),
        save_top_k=2,
        verbose=True,
        monitor="val_loss",
        mode="min"
    )

    logger = TensorBoardLogger("lightning_logs", name="Drowsy_MI" + str(n))

    trainer = pl.Trainer(
        logger=logger,
        callbacks=[checkpoint_callback],
        max_epochs=N_EPOCHS,
        gpus=[0],
#         gpus=1, 
#         auto_select_gpus=True,
        auto_lr_find=True, 
        # check_val_every_n_epoch=10
        # refresh_rate=20,
    )
    
    # Training start
    if (n == 18):
        trainer.fit(model, data_module, ckpt_path="/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v6.ckpt")
    else:
        trainer.fit(model, data_module)
    trainer.test(model, data_module)
    
    FEATURE_COLUMNS.pop(0)
    n = n + 1

------------------ Round: 17 ------------------
['TP7', 'C3', 'F3', 'PZ', 'F4', 'O1', 'FT7', 'CP4', 'FP1', 'C4', 'T6', 'FT8', 'CZ', 'PO1', 'OZ', 'A2', 'A1', 'T3', 'P4', 'P3', 'FT9', 'CPZ', 'PO2']
Len: 23


GPU available: True, used: True
TPU available: False, using: 0 TPU cores
IPU available: False, using: 0 IPUs
Restoring states from the checkpoint path at /Workspace/code/checkpoints/best-checkpoint-corr-mi-17.ckpt
LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1,2]
  "You're resuming from a checkpoint that ended mid-epoch."
Restored all states from the checkpoint file at /Workspace/code/checkpoints/best-checkpoint-corr-mi-17.ckpt

  | Name      | Type             | Params
-----------------------------------------------
0 | model     | DrowsyModel      | 1.3 M 
1 | criterion | CrossEntropyLoss | 0     
-----------------------------------------------
1.3 M     Trainable params
0         Non-trainable params
1.3 M     Total params
5.364     Total estimated model params size (MB)
  rank_zero_warn(f"Checkpoint directory {dirpath} exists and is not empty.")


                                                                      

Global seed set to 42


Epoch 199:  89%|████████▊ | 226/255 [01:17<00:09,  2.92it/s, loss=0.0423, v_num=5, train_loss=0.00486, train_accuracy=1.000]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 199:  89%|████████▉ | 228/255 [01:19<00:09,  2.88it/s, loss=0.0423, v_num=5, train_loss=0.00486, train_accuracy=1.000]
Epoch 199:  90%|█████████ | 230/255 [01:19<00:08,  2.90it/s, loss=0.0423, v_num=5, train_loss=0.00486, train_accuracy=1.000]
Epoch 199:  91%|█████████ | 232/255 [01:19<00:07,  2.92it/s, loss=0.0423, v_num=5, train_loss=0.00486, train_accuracy=1.000]
Epoch 199:  92%|█████████▏| 234/255 [01:19<00:07,  2.94it/s, loss=0.0423, v_num=5, train_loss=0.00486, train_accuracy=1.000]
Epoch 199:  93%|█████████▎| 236/255 [01:19<00:06,  2.96it/s, loss=0.0423, v_num=5, train_loss=0.00486, train_accuracy=1.000]
Epoch 199:  93%|█████████▎| 238/255 [01:19<00:05,  2.98it/s, loss=0.0423, v_num=5, train_loss=0.00486, train_accuracy=1.000]
Epoch 199:  94%|█████████▍| 240/255 [

Epoch 199, global step 45199: val_loss was not in top 2


Epoch 199: 100%|██████████| 255/255 [01:21<00:00,  3.13it/s, loss=0.0423, v_num=5, train_loss=0.00486, train_accuracy=1.000, val_loss=0.157, val_accuracy=0.945]


LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1,2]


Testing: 100%|██████████| 29/29 [00:03<00:00,  8.66it/s]--------------------------------------------------------------------------------
DATALOADER:0 TEST RESULTS
{'test_accuracy': 0.9503193497657776, 'test_loss': 0.1399056315422058}
--------------------------------------------------------------------------------
Testing: 100%|██████████| 29/29 [00:04<00:00,  7.25it/s]
------------------ Round: 18 ------------------
['C3', 'F3', 'PZ', 'F4', 'O1', 'FT7', 'CP4', 'FP1', 'C4', 'T6', 'FT8', 'CZ', 'PO1', 'OZ', 'A2', 'A1', 'T3', 'P4', 'P3', 'FT9', 'CPZ', 'PO2']
Len: 22


GPU available: True, used: True
TPU available: False, using: 0 TPU cores
IPU available: False, using: 0 IPUs
LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1,2]

  | Name      | Type             | Params
-----------------------------------------------
0 | model     | DrowsyModel      | 1.3 M 
1 | criterion | CrossEntropyLoss | 0     
-----------------------------------------------
1.3 M     Trainable params
0         Non-trainable params
1.3 M     Total params
5.360     Total estimated model params size (MB)
  rank_zero_warn(f"Checkpoint directory {dirpath} exists and is not empty.")


                                                                      

Global seed set to 42


Epoch 0:  89%|████████▊ | 226/255 [01:16<00:09,  2.96it/s, loss=0.648, v_num=3, train_loss=0.525, train_accuracy=0.833]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 0:  89%|████████▉ | 228/255 [01:19<00:09,  2.85it/s, loss=0.648, v_num=3, train_loss=0.525, train_accuracy=0.833]
Epoch 0:  90%|█████████ | 230/255 [01:20<00:08,  2.87it/s, loss=0.648, v_num=3, train_loss=0.525, train_accuracy=0.833]
Epoch 0:  91%|█████████ | 232/255 [01:20<00:07,  2.89it/s, loss=0.648, v_num=3, train_loss=0.525, train_accuracy=0.833]
Epoch 0:  92%|█████████▏| 234/255 [01:20<00:07,  2.91it/s, loss=0.648, v_num=3, train_loss=0.525, train_accuracy=0.833]
Epoch 0:  93%|█████████▎| 236/255 [01:20<00:06,  2.93it/s, loss=0.648, v_num=3, train_loss=0.525, train_accuracy=0.833]
Epoch 0:  93%|█████████▎| 238/255 [01:20<00:05,  2.95it/s, loss=0.648, v_num=3, train_loss=0.525, train_accuracy=0.833]
Epoch 0:  94%|█████████▍| 240/255 [01:20<00:05,  2.97it/s, loss=0.648, v

Epoch 0, global step 225: val_loss reached 0.68401 (best 0.68401), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v6.ckpt" as top 2


Epoch 1:  89%|████████▊ | 226/255 [01:16<00:09,  2.96it/s, loss=0.658, v_num=3, train_loss=0.648, train_accuracy=0.667, val_loss=0.684, val_accuracy=0.597]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 1:  89%|████████▉ | 228/255 [01:20<00:09,  2.84it/s, loss=0.658, v_num=3, train_loss=0.648, train_accuracy=0.667, val_loss=0.684, val_accuracy=0.597]
Epoch 1:  90%|█████████ | 230/255 [01:20<00:08,  2.86it/s, loss=0.658, v_num=3, train_loss=0.648, train_accuracy=0.667, val_loss=0.684, val_accuracy=0.597]
Epoch 1:  91%|█████████ | 232/255 [01:20<00:07,  2.88it/s, loss=0.658, v_num=3, train_loss=0.648, train_accuracy=0.667, val_loss=0.684, val_accuracy=0.597]
Epoch 1:  92%|█████████▏| 234/255 [01:20<00:07,  2.90it/s, loss=0.658, v_num=3, train_loss=0.648, train_accuracy=0.667, val_loss=0.684, val_accuracy=0.597]
Epoch 1:  93%|█████████▎| 236/255 [01:20<00:06,  2.92it/s, loss=0.658, v_num=3, train_loss=0.648, train_accuracy=0.667, val_loss=0.6

Epoch 1, global step 451: val_loss reached 0.67526 (best 0.67526), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v7.ckpt" as top 2


Epoch 2:  89%|████████▊ | 226/255 [01:16<00:09,  2.94it/s, loss=0.585, v_num=3, train_loss=0.576, train_accuracy=0.667, val_loss=0.675, val_accuracy=0.591]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 2:  89%|████████▉ | 228/255 [01:20<00:09,  2.82it/s, loss=0.585, v_num=3, train_loss=0.576, train_accuracy=0.667, val_loss=0.675, val_accuracy=0.591]
Epoch 2:  90%|█████████ | 230/255 [01:20<00:08,  2.84it/s, loss=0.585, v_num=3, train_loss=0.576, train_accuracy=0.667, val_loss=0.675, val_accuracy=0.591]
Epoch 2:  91%|█████████ | 232/255 [01:21<00:08,  2.86it/s, loss=0.585, v_num=3, train_loss=0.576, train_accuracy=0.667, val_loss=0.675, val_accuracy=0.591]
Epoch 2:  92%|█████████▏| 234/255 [01:21<00:07,  2.88it/s, loss=0.585, v_num=3, train_loss=0.576, train_accuracy=0.667, val_loss=0.675, val_accuracy=0.591]
Epoch 2:  93%|█████████▎| 236/255 [01:21<00:06,  2.90it/s, loss=0.585, v_num=3, train_loss=0.576, train_accuracy=0.667, val_loss=0.6

Epoch 2, global step 677: val_loss reached 0.60173 (best 0.60173), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v6.ckpt" as top 2


Epoch 3:  89%|████████▊ | 226/255 [01:16<00:09,  2.95it/s, loss=0.818, v_num=3, train_loss=1.140, train_accuracy=0.333, val_loss=0.602, val_accuracy=0.694]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 3:  89%|████████▉ | 228/255 [01:20<00:09,  2.85it/s, loss=0.818, v_num=3, train_loss=1.140, train_accuracy=0.333, val_loss=0.602, val_accuracy=0.694]
Epoch 3:  90%|█████████ | 230/255 [01:20<00:08,  2.87it/s, loss=0.818, v_num=3, train_loss=1.140, train_accuracy=0.333, val_loss=0.602, val_accuracy=0.694]
Epoch 3:  91%|█████████ | 232/255 [01:20<00:07,  2.89it/s, loss=0.818, v_num=3, train_loss=1.140, train_accuracy=0.333, val_loss=0.602, val_accuracy=0.694]
Epoch 3:  92%|█████████▏| 234/255 [01:20<00:07,  2.91it/s, loss=0.818, v_num=3, train_loss=1.140, train_accuracy=0.333, val_loss=0.602, val_accuracy=0.694]
Epoch 3:  93%|█████████▎| 236/255 [01:20<00:06,  2.93it/s, loss=0.818, v_num=3, train_loss=1.140, train_accuracy=0.333, val_loss=0.6

Epoch 3, global step 903: val_loss was not in top 2


Epoch 4:  89%|████████▊ | 226/255 [01:16<00:09,  2.97it/s, loss=0.604, v_num=3, train_loss=0.574, train_accuracy=0.667, val_loss=0.869, val_accuracy=0.551]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 4:  89%|████████▉ | 228/255 [01:19<00:09,  2.86it/s, loss=0.604, v_num=3, train_loss=0.574, train_accuracy=0.667, val_loss=0.869, val_accuracy=0.551]
Epoch 4:  90%|█████████ | 230/255 [01:19<00:08,  2.88it/s, loss=0.604, v_num=3, train_loss=0.574, train_accuracy=0.667, val_loss=0.869, val_accuracy=0.551]
Epoch 4:  91%|█████████ | 232/255 [01:20<00:07,  2.90it/s, loss=0.604, v_num=3, train_loss=0.574, train_accuracy=0.667, val_loss=0.869, val_accuracy=0.551]
Epoch 4:  92%|█████████▏| 234/255 [01:20<00:07,  2.92it/s, loss=0.604, v_num=3, train_loss=0.574, train_accuracy=0.667, val_loss=0.869, val_accuracy=0.551]
Epoch 4:  93%|█████████▎| 236/255 [01:20<00:06,  2.94it/s, loss=0.604, v_num=3, train_loss=0.574, train_accuracy=0.667, val_loss=0.8

Epoch 4, global step 1129: val_loss reached 0.61628 (best 0.60173), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v7.ckpt" as top 2


Epoch 5:  89%|████████▊ | 226/255 [01:16<00:09,  2.94it/s, loss=0.518, v_num=3, train_loss=0.465, train_accuracy=0.778, val_loss=0.616, val_accuracy=0.674]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 5:  89%|████████▉ | 228/255 [01:20<00:09,  2.83it/s, loss=0.518, v_num=3, train_loss=0.465, train_accuracy=0.778, val_loss=0.616, val_accuracy=0.674]
Epoch 5:  90%|█████████ | 230/255 [01:20<00:08,  2.85it/s, loss=0.518, v_num=3, train_loss=0.465, train_accuracy=0.778, val_loss=0.616, val_accuracy=0.674]
Epoch 5:  91%|█████████ | 232/255 [01:20<00:08,  2.87it/s, loss=0.518, v_num=3, train_loss=0.465, train_accuracy=0.778, val_loss=0.616, val_accuracy=0.674]
Epoch 5:  92%|█████████▏| 234/255 [01:20<00:07,  2.89it/s, loss=0.518, v_num=3, train_loss=0.465, train_accuracy=0.778, val_loss=0.616, val_accuracy=0.674]
Epoch 5:  93%|█████████▎| 236/255 [01:21<00:06,  2.91it/s, loss=0.518, v_num=3, train_loss=0.465, train_accuracy=0.778, val_loss=0.6

Epoch 5, global step 1355: val_loss reached 0.51963 (best 0.51963), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v7.ckpt" as top 2


Epoch 6:  89%|████████▊ | 226/255 [01:19<00:10,  2.84it/s, loss=0.456, v_num=3, train_loss=0.180, train_accuracy=1.000, val_loss=0.520, val_accuracy=0.765]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 6:  89%|████████▉ | 228/255 [01:23<00:09,  2.74it/s, loss=0.456, v_num=3, train_loss=0.180, train_accuracy=1.000, val_loss=0.520, val_accuracy=0.765]
Epoch 6:  90%|█████████ | 230/255 [01:23<00:09,  2.76it/s, loss=0.456, v_num=3, train_loss=0.180, train_accuracy=1.000, val_loss=0.520, val_accuracy=0.765]
Epoch 6:  91%|█████████ | 232/255 [01:23<00:08,  2.78it/s, loss=0.456, v_num=3, train_loss=0.180, train_accuracy=1.000, val_loss=0.520, val_accuracy=0.765]
Epoch 6:  92%|█████████▏| 234/255 [01:23<00:07,  2.80it/s, loss=0.456, v_num=3, train_loss=0.180, train_accuracy=1.000, val_loss=0.520, val_accuracy=0.765]
Epoch 6:  93%|█████████▎| 236/255 [01:23<00:06,  2.82it/s, loss=0.456, v_num=3, train_loss=0.180, train_accuracy=1.000, val_loss=0.5

Epoch 6, global step 1581: val_loss reached 0.55370 (best 0.51963), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v6.ckpt" as top 2


Epoch 7:  89%|████████▊ | 226/255 [01:19<00:10,  2.84it/s, loss=0.503, v_num=3, train_loss=0.687, train_accuracy=0.611, val_loss=0.554, val_accuracy=0.741]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 7:  89%|████████▉ | 228/255 [01:23<00:09,  2.74it/s, loss=0.503, v_num=3, train_loss=0.687, train_accuracy=0.611, val_loss=0.554, val_accuracy=0.741]
Epoch 7:  90%|█████████ | 230/255 [01:23<00:09,  2.76it/s, loss=0.503, v_num=3, train_loss=0.687, train_accuracy=0.611, val_loss=0.554, val_accuracy=0.741]
Epoch 7:  91%|█████████ | 232/255 [01:23<00:08,  2.78it/s, loss=0.503, v_num=3, train_loss=0.687, train_accuracy=0.611, val_loss=0.554, val_accuracy=0.741]
Epoch 7:  92%|█████████▏| 234/255 [01:23<00:07,  2.80it/s, loss=0.503, v_num=3, train_loss=0.687, train_accuracy=0.611, val_loss=0.554, val_accuracy=0.741]
Epoch 7:  93%|█████████▎| 236/255 [01:23<00:06,  2.82it/s, loss=0.503, v_num=3, train_loss=0.687, train_accuracy=0.611, val_loss=0.5

Epoch 7, global step 1807: val_loss reached 0.55181 (best 0.51963), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v6.ckpt" as top 2


Epoch 8:  89%|████████▊ | 226/255 [01:17<00:09,  2.92it/s, loss=0.456, v_num=3, train_loss=0.375, train_accuracy=0.833, val_loss=0.552, val_accuracy=0.702]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 8:  89%|████████▉ | 228/255 [01:21<00:09,  2.81it/s, loss=0.456, v_num=3, train_loss=0.375, train_accuracy=0.833, val_loss=0.552, val_accuracy=0.702]
Epoch 8:  90%|█████████ | 230/255 [01:21<00:08,  2.83it/s, loss=0.456, v_num=3, train_loss=0.375, train_accuracy=0.833, val_loss=0.552, val_accuracy=0.702]
Epoch 8:  91%|█████████ | 232/255 [01:21<00:08,  2.85it/s, loss=0.456, v_num=3, train_loss=0.375, train_accuracy=0.833, val_loss=0.552, val_accuracy=0.702]
Epoch 8:  92%|█████████▏| 234/255 [01:21<00:07,  2.87it/s, loss=0.456, v_num=3, train_loss=0.375, train_accuracy=0.833, val_loss=0.552, val_accuracy=0.702]
Epoch 8:  93%|█████████▎| 236/255 [01:21<00:06,  2.89it/s, loss=0.456, v_num=3, train_loss=0.375, train_accuracy=0.833, val_loss=0.5

Epoch 8, global step 2033: val_loss reached 0.47892 (best 0.47892), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v6.ckpt" as top 2


Epoch 9:  89%|████████▊ | 226/255 [01:18<00:10,  2.87it/s, loss=0.502, v_num=3, train_loss=0.586, train_accuracy=0.778, val_loss=0.479, val_accuracy=0.781]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 9:  89%|████████▉ | 228/255 [01:22<00:09,  2.77it/s, loss=0.502, v_num=3, train_loss=0.586, train_accuracy=0.778, val_loss=0.479, val_accuracy=0.781]
Epoch 9:  90%|█████████ | 230/255 [01:22<00:08,  2.79it/s, loss=0.502, v_num=3, train_loss=0.586, train_accuracy=0.778, val_loss=0.479, val_accuracy=0.781]
Epoch 9:  91%|█████████ | 232/255 [01:22<00:08,  2.81it/s, loss=0.502, v_num=3, train_loss=0.586, train_accuracy=0.778, val_loss=0.479, val_accuracy=0.781]
Epoch 9:  92%|█████████▏| 234/255 [01:22<00:07,  2.83it/s, loss=0.502, v_num=3, train_loss=0.586, train_accuracy=0.778, val_loss=0.479, val_accuracy=0.781]
Epoch 9:  93%|█████████▎| 236/255 [01:22<00:06,  2.85it/s, loss=0.502, v_num=3, train_loss=0.586, train_accuracy=0.778, val_loss=0.4

Epoch 9, global step 2259: val_loss reached 0.45462 (best 0.45462), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v7.ckpt" as top 2


Epoch 10:  89%|████████▊ | 226/255 [01:18<00:10,  2.89it/s, loss=0.329, v_num=3, train_loss=0.319, train_accuracy=0.833, val_loss=0.455, val_accuracy=0.793]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 10:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.329, v_num=3, train_loss=0.319, train_accuracy=0.833, val_loss=0.455, val_accuracy=0.793]
Epoch 10:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.329, v_num=3, train_loss=0.319, train_accuracy=0.833, val_loss=0.455, val_accuracy=0.793]
Epoch 10:  91%|█████████ | 232/255 [01:22<00:08,  2.83it/s, loss=0.329, v_num=3, train_loss=0.319, train_accuracy=0.833, val_loss=0.455, val_accuracy=0.793]
Epoch 10:  92%|█████████▏| 234/255 [01:22<00:07,  2.84it/s, loss=0.329, v_num=3, train_loss=0.319, train_accuracy=0.833, val_loss=0.455, val_accuracy=0.793]
Epoch 10:  93%|█████████▎| 236/255 [01:22<00:06,  2.86it/s, loss=0.329, v_num=3, train_loss=0.319, train_accuracy=0.833, val_lo

Epoch 10, global step 2485: val_loss reached 0.40675 (best 0.40675), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v6.ckpt" as top 2


Epoch 11:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.518, v_num=3, train_loss=0.507, train_accuracy=0.722, val_loss=0.407, val_accuracy=0.835]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 11:  89%|████████▉ | 228/255 [01:24<00:10,  2.68it/s, loss=0.518, v_num=3, train_loss=0.507, train_accuracy=0.722, val_loss=0.407, val_accuracy=0.835]
Epoch 11:  90%|█████████ | 230/255 [01:25<00:09,  2.70it/s, loss=0.518, v_num=3, train_loss=0.507, train_accuracy=0.722, val_loss=0.407, val_accuracy=0.835]
Epoch 11:  91%|█████████ | 232/255 [01:25<00:08,  2.72it/s, loss=0.518, v_num=3, train_loss=0.507, train_accuracy=0.722, val_loss=0.407, val_accuracy=0.835]
Epoch 11:  92%|█████████▏| 234/255 [01:25<00:07,  2.74it/s, loss=0.518, v_num=3, train_loss=0.507, train_accuracy=0.722, val_loss=0.407, val_accuracy=0.835]
Epoch 11:  93%|█████████▎| 236/255 [01:25<00:06,  2.75it/s, loss=0.518, v_num=3, train_loss=0.507, train_accuracy=0.722, val_lo

Epoch 11, global step 2711: val_loss was not in top 2


Epoch 12:  89%|████████▊ | 226/255 [01:22<00:10,  2.75it/s, loss=0.435, v_num=3, train_loss=0.349, train_accuracy=0.889, val_loss=0.614, val_accuracy=0.732]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 12:  89%|████████▉ | 228/255 [01:26<00:10,  2.62it/s, loss=0.435, v_num=3, train_loss=0.349, train_accuracy=0.889, val_loss=0.614, val_accuracy=0.732]
Epoch 12:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.435, v_num=3, train_loss=0.349, train_accuracy=0.889, val_loss=0.614, val_accuracy=0.732]
Epoch 12:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.435, v_num=3, train_loss=0.349, train_accuracy=0.889, val_loss=0.614, val_accuracy=0.732]
Epoch 12:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.435, v_num=3, train_loss=0.349, train_accuracy=0.889, val_loss=0.614, val_accuracy=0.732]
Epoch 12:  93%|█████████▎| 236/255 [01:27<00:07,  2.69it/s, loss=0.435, v_num=3, train_loss=0.349, train_accuracy=0.889, val_lo

Epoch 12, global step 2937: val_loss was not in top 2


Epoch 13:  89%|████████▊ | 226/255 [01:23<00:10,  2.72it/s, loss=0.355, v_num=3, train_loss=0.435, train_accuracy=0.778, val_loss=0.484, val_accuracy=0.797]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 13:  89%|████████▉ | 228/255 [01:28<00:10,  2.59it/s, loss=0.355, v_num=3, train_loss=0.435, train_accuracy=0.778, val_loss=0.484, val_accuracy=0.797]
Epoch 13:  90%|█████████ | 230/255 [01:28<00:09,  2.60it/s, loss=0.355, v_num=3, train_loss=0.435, train_accuracy=0.778, val_loss=0.484, val_accuracy=0.797]
Epoch 13:  91%|█████████ | 232/255 [01:28<00:08,  2.62it/s, loss=0.355, v_num=3, train_loss=0.435, train_accuracy=0.778, val_loss=0.484, val_accuracy=0.797]
Epoch 13:  92%|█████████▏| 234/255 [01:28<00:07,  2.64it/s, loss=0.355, v_num=3, train_loss=0.435, train_accuracy=0.778, val_loss=0.484, val_accuracy=0.797]
Epoch 13:  93%|█████████▎| 236/255 [01:28<00:07,  2.66it/s, loss=0.355, v_num=3, train_loss=0.435, train_accuracy=0.778, val_lo

Epoch 13, global step 3163: val_loss reached 0.39304 (best 0.39304), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v7.ckpt" as top 2


Epoch 14:  89%|████████▊ | 226/255 [01:23<00:10,  2.70it/s, loss=0.572, v_num=3, train_loss=0.495, train_accuracy=0.833, val_loss=0.393, val_accuracy=0.852]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 14:  89%|████████▉ | 228/255 [01:28<00:10,  2.58it/s, loss=0.572, v_num=3, train_loss=0.495, train_accuracy=0.833, val_loss=0.393, val_accuracy=0.852]
Epoch 14:  90%|█████████ | 230/255 [01:28<00:09,  2.59it/s, loss=0.572, v_num=3, train_loss=0.495, train_accuracy=0.833, val_loss=0.393, val_accuracy=0.852]
Epoch 14:  91%|█████████ | 232/255 [01:28<00:08,  2.61it/s, loss=0.572, v_num=3, train_loss=0.495, train_accuracy=0.833, val_loss=0.393, val_accuracy=0.852]
Epoch 14:  92%|█████████▏| 234/255 [01:28<00:07,  2.63it/s, loss=0.572, v_num=3, train_loss=0.495, train_accuracy=0.833, val_loss=0.393, val_accuracy=0.852]
Epoch 14:  93%|█████████▎| 236/255 [01:29<00:07,  2.65it/s, loss=0.572, v_num=3, train_loss=0.495, train_accuracy=0.833, val_lo

Epoch 14, global step 3389: val_loss was not in top 2


Epoch 15:  89%|████████▊ | 226/255 [01:23<00:10,  2.71it/s, loss=0.519, v_num=3, train_loss=0.487, train_accuracy=0.833, val_loss=0.598, val_accuracy=0.721]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 15:  89%|████████▉ | 228/255 [01:28<00:10,  2.58it/s, loss=0.519, v_num=3, train_loss=0.487, train_accuracy=0.833, val_loss=0.598, val_accuracy=0.721]
Epoch 15:  90%|█████████ | 230/255 [01:28<00:09,  2.60it/s, loss=0.519, v_num=3, train_loss=0.487, train_accuracy=0.833, val_loss=0.598, val_accuracy=0.721]
Epoch 15:  91%|█████████ | 232/255 [01:28<00:08,  2.61it/s, loss=0.519, v_num=3, train_loss=0.487, train_accuracy=0.833, val_loss=0.598, val_accuracy=0.721]
Epoch 15:  92%|█████████▏| 234/255 [01:28<00:07,  2.63it/s, loss=0.519, v_num=3, train_loss=0.487, train_accuracy=0.833, val_loss=0.598, val_accuracy=0.721]
Epoch 15:  93%|█████████▎| 236/255 [01:29<00:07,  2.65it/s, loss=0.519, v_num=3, train_loss=0.487, train_accuracy=0.833, val_lo

Epoch 15, global step 3615: val_loss was not in top 2


Epoch 16:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.469, v_num=3, train_loss=0.415, train_accuracy=0.833, val_loss=0.555, val_accuracy=0.773]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 16:  89%|████████▉ | 228/255 [01:23<00:09,  2.72it/s, loss=0.469, v_num=3, train_loss=0.415, train_accuracy=0.833, val_loss=0.555, val_accuracy=0.773]
Epoch 16:  90%|█████████ | 230/255 [01:23<00:09,  2.74it/s, loss=0.469, v_num=3, train_loss=0.415, train_accuracy=0.833, val_loss=0.555, val_accuracy=0.773]
Epoch 16:  91%|█████████ | 232/255 [01:24<00:08,  2.76it/s, loss=0.469, v_num=3, train_loss=0.415, train_accuracy=0.833, val_loss=0.555, val_accuracy=0.773]
Epoch 16:  92%|█████████▏| 234/255 [01:24<00:07,  2.78it/s, loss=0.469, v_num=3, train_loss=0.415, train_accuracy=0.833, val_loss=0.555, val_accuracy=0.773]
Epoch 16:  93%|█████████▎| 236/255 [01:24<00:06,  2.80it/s, loss=0.469, v_num=3, train_loss=0.415, train_accuracy=0.833, val_lo

Epoch 16, global step 3841: val_loss was not in top 2


Epoch 17:  89%|████████▊ | 226/255 [01:17<00:09,  2.91it/s, loss=0.402, v_num=3, train_loss=0.360, train_accuracy=0.889, val_loss=0.513, val_accuracy=0.791]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 17:  89%|████████▉ | 228/255 [01:21<00:09,  2.80it/s, loss=0.402, v_num=3, train_loss=0.360, train_accuracy=0.889, val_loss=0.513, val_accuracy=0.791]
Epoch 17:  90%|█████████ | 230/255 [01:21<00:08,  2.82it/s, loss=0.402, v_num=3, train_loss=0.360, train_accuracy=0.889, val_loss=0.513, val_accuracy=0.791]
Epoch 17:  91%|█████████ | 232/255 [01:21<00:08,  2.84it/s, loss=0.402, v_num=3, train_loss=0.360, train_accuracy=0.889, val_loss=0.513, val_accuracy=0.791]
Epoch 17:  92%|█████████▏| 234/255 [01:21<00:07,  2.86it/s, loss=0.402, v_num=3, train_loss=0.360, train_accuracy=0.889, val_loss=0.513, val_accuracy=0.791]
Epoch 17:  93%|█████████▎| 236/255 [01:21<00:06,  2.88it/s, loss=0.402, v_num=3, train_loss=0.360, train_accuracy=0.889, val_lo

Epoch 17, global step 4067: val_loss was not in top 2


Epoch 18:  89%|████████▊ | 226/255 [01:17<00:09,  2.91it/s, loss=0.336, v_num=3, train_loss=0.212, train_accuracy=0.889, val_loss=0.453, val_accuracy=0.820]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 18:  89%|████████▉ | 228/255 [01:21<00:09,  2.80it/s, loss=0.336, v_num=3, train_loss=0.212, train_accuracy=0.889, val_loss=0.453, val_accuracy=0.820]
Epoch 18:  90%|█████████ | 230/255 [01:21<00:08,  2.82it/s, loss=0.336, v_num=3, train_loss=0.212, train_accuracy=0.889, val_loss=0.453, val_accuracy=0.820]
Epoch 18:  91%|█████████ | 232/255 [01:21<00:08,  2.84it/s, loss=0.336, v_num=3, train_loss=0.212, train_accuracy=0.889, val_loss=0.453, val_accuracy=0.820]
Epoch 18:  92%|█████████▏| 234/255 [01:21<00:07,  2.86it/s, loss=0.336, v_num=3, train_loss=0.212, train_accuracy=0.889, val_loss=0.453, val_accuracy=0.820]
Epoch 18:  93%|█████████▎| 236/255 [01:21<00:06,  2.88it/s, loss=0.336, v_num=3, train_loss=0.212, train_accuracy=0.889, val_lo

Epoch 18, global step 4293: val_loss reached 0.37766 (best 0.37766), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v6.ckpt" as top 2


Epoch 19:  89%|████████▊ | 226/255 [01:17<00:09,  2.91it/s, loss=0.585, v_num=3, train_loss=0.618, train_accuracy=0.722, val_loss=0.378, val_accuracy=0.846]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 19:  89%|████████▉ | 228/255 [01:21<00:09,  2.80it/s, loss=0.585, v_num=3, train_loss=0.618, train_accuracy=0.722, val_loss=0.378, val_accuracy=0.846]
Epoch 19:  90%|█████████ | 230/255 [01:21<00:08,  2.82it/s, loss=0.585, v_num=3, train_loss=0.618, train_accuracy=0.722, val_loss=0.378, val_accuracy=0.846]
Epoch 19:  91%|█████████ | 232/255 [01:21<00:08,  2.84it/s, loss=0.585, v_num=3, train_loss=0.618, train_accuracy=0.722, val_loss=0.378, val_accuracy=0.846]
Epoch 19:  92%|█████████▏| 234/255 [01:21<00:07,  2.86it/s, loss=0.585, v_num=3, train_loss=0.618, train_accuracy=0.722, val_loss=0.378, val_accuracy=0.846]
Epoch 19:  93%|█████████▎| 236/255 [01:21<00:06,  2.88it/s, loss=0.585, v_num=3, train_loss=0.618, train_accuracy=0.722, val_lo

Epoch 19, global step 4519: val_loss was not in top 2


Epoch 20:  89%|████████▊ | 226/255 [01:17<00:09,  2.91it/s, loss=0.289, v_num=3, train_loss=0.331, train_accuracy=0.889, val_loss=0.423, val_accuracy=0.819]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 20:  89%|████████▉ | 228/255 [01:21<00:09,  2.80it/s, loss=0.289, v_num=3, train_loss=0.331, train_accuracy=0.889, val_loss=0.423, val_accuracy=0.819]
Epoch 20:  90%|█████████ | 230/255 [01:21<00:08,  2.82it/s, loss=0.289, v_num=3, train_loss=0.331, train_accuracy=0.889, val_loss=0.423, val_accuracy=0.819]
Epoch 20:  91%|█████████ | 232/255 [01:21<00:08,  2.84it/s, loss=0.289, v_num=3, train_loss=0.331, train_accuracy=0.889, val_loss=0.423, val_accuracy=0.819]
Epoch 20:  92%|█████████▏| 234/255 [01:21<00:07,  2.86it/s, loss=0.289, v_num=3, train_loss=0.331, train_accuracy=0.889, val_loss=0.423, val_accuracy=0.819]
Epoch 20:  93%|█████████▎| 236/255 [01:22<00:06,  2.88it/s, loss=0.289, v_num=3, train_loss=0.331, train_accuracy=0.889, val_lo

Epoch 20, global step 4745: val_loss reached 0.33121 (best 0.33121), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v7.ckpt" as top 2


Epoch 21:  89%|████████▊ | 226/255 [01:18<00:10,  2.88it/s, loss=0.293, v_num=3, train_loss=0.276, train_accuracy=0.889, val_loss=0.331, val_accuracy=0.868]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 21:  89%|████████▉ | 228/255 [01:22<00:09,  2.78it/s, loss=0.293, v_num=3, train_loss=0.276, train_accuracy=0.889, val_loss=0.331, val_accuracy=0.868]
Epoch 21:  90%|█████████ | 230/255 [01:22<00:08,  2.80it/s, loss=0.293, v_num=3, train_loss=0.276, train_accuracy=0.889, val_loss=0.331, val_accuracy=0.868]
Epoch 21:  91%|█████████ | 232/255 [01:22<00:08,  2.81it/s, loss=0.293, v_num=3, train_loss=0.276, train_accuracy=0.889, val_loss=0.331, val_accuracy=0.868]
Epoch 21:  92%|█████████▏| 234/255 [01:22<00:07,  2.83it/s, loss=0.293, v_num=3, train_loss=0.276, train_accuracy=0.889, val_loss=0.331, val_accuracy=0.868]
Epoch 21:  93%|█████████▎| 236/255 [01:22<00:06,  2.85it/s, loss=0.293, v_num=3, train_loss=0.276, train_accuracy=0.889, val_lo

Epoch 21, global step 4971: val_loss reached 0.30052 (best 0.30052), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v6.ckpt" as top 2


Epoch 22:  89%|████████▊ | 226/255 [01:18<00:10,  2.87it/s, loss=0.25, v_num=3, train_loss=0.144, train_accuracy=0.889, val_loss=0.301, val_accuracy=0.879] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 22:  89%|████████▉ | 228/255 [01:22<00:09,  2.77it/s, loss=0.25, v_num=3, train_loss=0.144, train_accuracy=0.889, val_loss=0.301, val_accuracy=0.879]
Epoch 22:  90%|█████████ | 230/255 [01:22<00:08,  2.79it/s, loss=0.25, v_num=3, train_loss=0.144, train_accuracy=0.889, val_loss=0.301, val_accuracy=0.879]
Epoch 22:  91%|█████████ | 232/255 [01:22<00:08,  2.81it/s, loss=0.25, v_num=3, train_loss=0.144, train_accuracy=0.889, val_loss=0.301, val_accuracy=0.879]
Epoch 22:  92%|█████████▏| 234/255 [01:22<00:07,  2.82it/s, loss=0.25, v_num=3, train_loss=0.144, train_accuracy=0.889, val_loss=0.301, val_accuracy=0.879]
Epoch 22:  93%|█████████▎| 236/255 [01:22<00:06,  2.84it/s, loss=0.25, v_num=3, train_loss=0.144, train_accuracy=0.889, val_loss=0.

Epoch 22, global step 5197: val_loss reached 0.30382 (best 0.30052), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v7.ckpt" as top 2


Epoch 23:  89%|████████▊ | 226/255 [01:17<00:09,  2.90it/s, loss=0.289, v_num=3, train_loss=0.343, train_accuracy=0.889, val_loss=0.304, val_accuracy=0.886]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 23:  89%|████████▉ | 228/255 [01:21<00:09,  2.80it/s, loss=0.289, v_num=3, train_loss=0.343, train_accuracy=0.889, val_loss=0.304, val_accuracy=0.886]
Epoch 23:  90%|█████████ | 230/255 [01:21<00:08,  2.82it/s, loss=0.289, v_num=3, train_loss=0.343, train_accuracy=0.889, val_loss=0.304, val_accuracy=0.886]
Epoch 23:  91%|█████████ | 232/255 [01:21<00:08,  2.84it/s, loss=0.289, v_num=3, train_loss=0.343, train_accuracy=0.889, val_loss=0.304, val_accuracy=0.886]
Epoch 23:  92%|█████████▏| 234/255 [01:21<00:07,  2.86it/s, loss=0.289, v_num=3, train_loss=0.343, train_accuracy=0.889, val_loss=0.304, val_accuracy=0.886]
Epoch 23:  93%|█████████▎| 236/255 [01:22<00:06,  2.88it/s, loss=0.289, v_num=3, train_loss=0.343, train_accuracy=0.889, val_lo

Epoch 23, global step 5423: val_loss reached 0.29574 (best 0.29574), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v7.ckpt" as top 2


Epoch 24:  89%|████████▊ | 226/255 [01:17<00:10,  2.90it/s, loss=0.245, v_num=3, train_loss=0.301, train_accuracy=0.833, val_loss=0.296, val_accuracy=0.870]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 24:  89%|████████▉ | 228/255 [01:21<00:09,  2.80it/s, loss=0.245, v_num=3, train_loss=0.301, train_accuracy=0.833, val_loss=0.296, val_accuracy=0.870]
Epoch 24:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.245, v_num=3, train_loss=0.301, train_accuracy=0.833, val_loss=0.296, val_accuracy=0.870]
Epoch 24:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.245, v_num=3, train_loss=0.301, train_accuracy=0.833, val_loss=0.296, val_accuracy=0.870]
Epoch 24:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.245, v_num=3, train_loss=0.301, train_accuracy=0.833, val_loss=0.296, val_accuracy=0.870]
Epoch 24:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.245, v_num=3, train_loss=0.301, train_accuracy=0.833, val_lo

Epoch 24, global step 5649: val_loss reached 0.27864 (best 0.27864), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v6.ckpt" as top 2


Epoch 25:  89%|████████▊ | 226/255 [01:18<00:10,  2.90it/s, loss=0.301, v_num=3, train_loss=0.325, train_accuracy=0.722, val_loss=0.279, val_accuracy=0.889] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 25:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.301, v_num=3, train_loss=0.325, train_accuracy=0.722, val_loss=0.279, val_accuracy=0.889]
Epoch 25:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.301, v_num=3, train_loss=0.325, train_accuracy=0.722, val_loss=0.279, val_accuracy=0.889]
Epoch 25:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.301, v_num=3, train_loss=0.325, train_accuracy=0.722, val_loss=0.279, val_accuracy=0.889]
Epoch 25:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.301, v_num=3, train_loss=0.325, train_accuracy=0.722, val_loss=0.279, val_accuracy=0.889]
Epoch 25:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.301, v_num=3, train_loss=0.325, train_accuracy=0.722, val_l

Epoch 25, global step 5875: val_loss was not in top 2


Epoch 26:  89%|████████▊ | 226/255 [01:17<00:09,  2.91it/s, loss=0.768, v_num=3, train_loss=0.407, train_accuracy=0.778, val_loss=0.309, val_accuracy=0.862]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 26:  89%|████████▉ | 228/255 [01:21<00:09,  2.80it/s, loss=0.768, v_num=3, train_loss=0.407, train_accuracy=0.778, val_loss=0.309, val_accuracy=0.862]
Epoch 26:  90%|█████████ | 230/255 [01:21<00:08,  2.82it/s, loss=0.768, v_num=3, train_loss=0.407, train_accuracy=0.778, val_loss=0.309, val_accuracy=0.862]
Epoch 26:  91%|█████████ | 232/255 [01:21<00:08,  2.84it/s, loss=0.768, v_num=3, train_loss=0.407, train_accuracy=0.778, val_loss=0.309, val_accuracy=0.862]
Epoch 26:  92%|█████████▏| 234/255 [01:21<00:07,  2.86it/s, loss=0.768, v_num=3, train_loss=0.407, train_accuracy=0.778, val_loss=0.309, val_accuracy=0.862]
Epoch 26:  93%|█████████▎| 236/255 [01:22<00:06,  2.88it/s, loss=0.768, v_num=3, train_loss=0.407, train_accuracy=0.778, val_lo

Epoch 26, global step 6101: val_loss was not in top 2


Epoch 27:  89%|████████▊ | 226/255 [01:17<00:09,  2.90it/s, loss=0.262, v_num=3, train_loss=0.389, train_accuracy=0.778, val_loss=0.539, val_accuracy=0.732] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 27:  89%|████████▉ | 228/255 [01:21<00:09,  2.80it/s, loss=0.262, v_num=3, train_loss=0.389, train_accuracy=0.778, val_loss=0.539, val_accuracy=0.732]
Epoch 27:  90%|█████████ | 230/255 [01:21<00:08,  2.82it/s, loss=0.262, v_num=3, train_loss=0.389, train_accuracy=0.778, val_loss=0.539, val_accuracy=0.732]
Epoch 27:  91%|█████████ | 232/255 [01:21<00:08,  2.84it/s, loss=0.262, v_num=3, train_loss=0.389, train_accuracy=0.778, val_loss=0.539, val_accuracy=0.732]
Epoch 27:  92%|█████████▏| 234/255 [01:21<00:07,  2.86it/s, loss=0.262, v_num=3, train_loss=0.389, train_accuracy=0.778, val_loss=0.539, val_accuracy=0.732]
Epoch 27:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.262, v_num=3, train_loss=0.389, train_accuracy=0.778, val_l

Epoch 27, global step 6327: val_loss reached 0.27257 (best 0.27257), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v7.ckpt" as top 2


Epoch 28:  89%|████████▊ | 226/255 [01:17<00:10,  2.90it/s, loss=0.219, v_num=3, train_loss=0.428, train_accuracy=0.722, val_loss=0.273, val_accuracy=0.894]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 28:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.219, v_num=3, train_loss=0.428, train_accuracy=0.722, val_loss=0.273, val_accuracy=0.894]
Epoch 28:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.219, v_num=3, train_loss=0.428, train_accuracy=0.722, val_loss=0.273, val_accuracy=0.894]
Epoch 28:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.219, v_num=3, train_loss=0.428, train_accuracy=0.722, val_loss=0.273, val_accuracy=0.894]
Epoch 28:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.219, v_num=3, train_loss=0.428, train_accuracy=0.722, val_loss=0.273, val_accuracy=0.894]
Epoch 28:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.219, v_num=3, train_loss=0.428, train_accuracy=0.722, val_lo

Epoch 28, global step 6553: val_loss was not in top 2


Epoch 29:  89%|████████▊ | 226/255 [01:17<00:09,  2.91it/s, loss=0.23, v_num=3, train_loss=0.0999, train_accuracy=0.944, val_loss=0.290, val_accuracy=0.879] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 29:  89%|████████▉ | 228/255 [01:21<00:09,  2.80it/s, loss=0.23, v_num=3, train_loss=0.0999, train_accuracy=0.944, val_loss=0.290, val_accuracy=0.879]
Epoch 29:  90%|█████████ | 230/255 [01:21<00:08,  2.82it/s, loss=0.23, v_num=3, train_loss=0.0999, train_accuracy=0.944, val_loss=0.290, val_accuracy=0.879]
Epoch 29:  91%|█████████ | 232/255 [01:21<00:08,  2.84it/s, loss=0.23, v_num=3, train_loss=0.0999, train_accuracy=0.944, val_loss=0.290, val_accuracy=0.879]
Epoch 29:  92%|█████████▏| 234/255 [01:21<00:07,  2.86it/s, loss=0.23, v_num=3, train_loss=0.0999, train_accuracy=0.944, val_loss=0.290, val_accuracy=0.879]
Epoch 29:  93%|█████████▎| 236/255 [01:22<00:06,  2.88it/s, loss=0.23, v_num=3, train_loss=0.0999, train_accuracy=0.944, val_l

Epoch 29, global step 6779: val_loss reached 0.26353 (best 0.26353), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v6.ckpt" as top 2


Epoch 30:  89%|████████▊ | 226/255 [01:17<00:09,  2.90it/s, loss=0.208, v_num=3, train_loss=0.143, train_accuracy=0.944, val_loss=0.264, val_accuracy=0.889] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 30:  89%|████████▉ | 228/255 [01:21<00:09,  2.80it/s, loss=0.208, v_num=3, train_loss=0.143, train_accuracy=0.944, val_loss=0.264, val_accuracy=0.889]
Epoch 30:  90%|█████████ | 230/255 [01:21<00:08,  2.82it/s, loss=0.208, v_num=3, train_loss=0.143, train_accuracy=0.944, val_loss=0.264, val_accuracy=0.889]
Epoch 30:  91%|█████████ | 232/255 [01:21<00:08,  2.84it/s, loss=0.208, v_num=3, train_loss=0.143, train_accuracy=0.944, val_loss=0.264, val_accuracy=0.889]
Epoch 30:  92%|█████████▏| 234/255 [01:21<00:07,  2.86it/s, loss=0.208, v_num=3, train_loss=0.143, train_accuracy=0.944, val_loss=0.264, val_accuracy=0.889]
Epoch 30:  93%|█████████▎| 236/255 [01:22<00:06,  2.88it/s, loss=0.208, v_num=3, train_loss=0.143, train_accuracy=0.944, val_l

Epoch 30, global step 7005: val_loss reached 0.24873 (best 0.24873), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v7.ckpt" as top 2


Epoch 31:  89%|████████▊ | 226/255 [01:17<00:09,  2.90it/s, loss=0.189, v_num=3, train_loss=0.130, train_accuracy=0.944, val_loss=0.249, val_accuracy=0.896] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 31:  89%|████████▉ | 228/255 [01:21<00:09,  2.80it/s, loss=0.189, v_num=3, train_loss=0.130, train_accuracy=0.944, val_loss=0.249, val_accuracy=0.896]
Epoch 31:  90%|█████████ | 230/255 [01:21<00:08,  2.82it/s, loss=0.189, v_num=3, train_loss=0.130, train_accuracy=0.944, val_loss=0.249, val_accuracy=0.896]
Epoch 31:  91%|█████████ | 232/255 [01:21<00:08,  2.84it/s, loss=0.189, v_num=3, train_loss=0.130, train_accuracy=0.944, val_loss=0.249, val_accuracy=0.896]
Epoch 31:  92%|█████████▏| 234/255 [01:21<00:07,  2.86it/s, loss=0.189, v_num=3, train_loss=0.130, train_accuracy=0.944, val_loss=0.249, val_accuracy=0.896]
Epoch 31:  93%|█████████▎| 236/255 [01:22<00:06,  2.88it/s, loss=0.189, v_num=3, train_loss=0.130, train_accuracy=0.944, val_l

Epoch 31, global step 7231: val_loss reached 0.25708 (best 0.24873), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v6.ckpt" as top 2


Epoch 32:  89%|████████▊ | 226/255 [01:17<00:09,  2.90it/s, loss=0.192, v_num=3, train_loss=0.142, train_accuracy=0.944, val_loss=0.257, val_accuracy=0.887] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 32:  89%|████████▉ | 228/255 [01:21<00:09,  2.80it/s, loss=0.192, v_num=3, train_loss=0.142, train_accuracy=0.944, val_loss=0.257, val_accuracy=0.887]
Epoch 32:  90%|█████████ | 230/255 [01:21<00:08,  2.82it/s, loss=0.192, v_num=3, train_loss=0.142, train_accuracy=0.944, val_loss=0.257, val_accuracy=0.887]
Epoch 32:  91%|█████████ | 232/255 [01:21<00:08,  2.84it/s, loss=0.192, v_num=3, train_loss=0.142, train_accuracy=0.944, val_loss=0.257, val_accuracy=0.887]
Epoch 32:  92%|█████████▏| 234/255 [01:21<00:07,  2.85it/s, loss=0.192, v_num=3, train_loss=0.142, train_accuracy=0.944, val_loss=0.257, val_accuracy=0.887]
Epoch 32:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.192, v_num=3, train_loss=0.142, train_accuracy=0.944, val_l

Epoch 32, global step 7457: val_loss reached 0.23154 (best 0.23154), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v6.ckpt" as top 2


Epoch 33:  89%|████████▊ | 226/255 [01:17<00:10,  2.90it/s, loss=0.2, v_num=3, train_loss=0.413, train_accuracy=0.944, val_loss=0.232, val_accuracy=0.906]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 33:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.2, v_num=3, train_loss=0.413, train_accuracy=0.944, val_loss=0.232, val_accuracy=0.906]
Epoch 33:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.2, v_num=3, train_loss=0.413, train_accuracy=0.944, val_loss=0.232, val_accuracy=0.906]
Epoch 33:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.2, v_num=3, train_loss=0.413, train_accuracy=0.944, val_loss=0.232, val_accuracy=0.906]
Epoch 33:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.2, v_num=3, train_loss=0.413, train_accuracy=0.944, val_loss=0.232, val_accuracy=0.906]
Epoch 33:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.2, v_num=3, train_loss=0.413, train_accuracy=0.944, val_loss=0.232,

Epoch 33, global step 7683: val_loss was not in top 2


Epoch 34:  89%|████████▊ | 226/255 [01:17<00:09,  2.90it/s, loss=0.213, v_num=3, train_loss=0.167, train_accuracy=0.889, val_loss=0.256, val_accuracy=0.896] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 34:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.213, v_num=3, train_loss=0.167, train_accuracy=0.889, val_loss=0.256, val_accuracy=0.896]
Epoch 34:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.213, v_num=3, train_loss=0.167, train_accuracy=0.889, val_loss=0.256, val_accuracy=0.896]
Epoch 34:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.213, v_num=3, train_loss=0.167, train_accuracy=0.889, val_loss=0.256, val_accuracy=0.896]
Epoch 34:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.213, v_num=3, train_loss=0.167, train_accuracy=0.889, val_loss=0.256, val_accuracy=0.896]
Epoch 34:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.213, v_num=3, train_loss=0.167, train_accuracy=0.889, val_l

Epoch 34, global step 7909: val_loss reached 0.23225 (best 0.23154), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v7.ckpt" as top 2


Epoch 35:  89%|████████▊ | 226/255 [01:17<00:09,  2.90it/s, loss=0.216, v_num=3, train_loss=0.365, train_accuracy=0.889, val_loss=0.232, val_accuracy=0.901] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 35:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.216, v_num=3, train_loss=0.365, train_accuracy=0.889, val_loss=0.232, val_accuracy=0.901]
Epoch 35:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.216, v_num=3, train_loss=0.365, train_accuracy=0.889, val_loss=0.232, val_accuracy=0.901]
Epoch 35:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.216, v_num=3, train_loss=0.365, train_accuracy=0.889, val_loss=0.232, val_accuracy=0.901]
Epoch 35:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.216, v_num=3, train_loss=0.365, train_accuracy=0.889, val_loss=0.232, val_accuracy=0.901]
Epoch 35:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.216, v_num=3, train_loss=0.365, train_accuracy=0.889, val_l

Epoch 35, global step 8135: val_loss was not in top 2


Epoch 36:  89%|████████▊ | 226/255 [01:17<00:09,  2.91it/s, loss=0.197, v_num=3, train_loss=0.0626, train_accuracy=1.000, val_loss=0.253, val_accuracy=0.898]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 36:  89%|████████▉ | 228/255 [01:21<00:09,  2.80it/s, loss=0.197, v_num=3, train_loss=0.0626, train_accuracy=1.000, val_loss=0.253, val_accuracy=0.898]
Epoch 36:  90%|█████████ | 230/255 [01:21<00:08,  2.82it/s, loss=0.197, v_num=3, train_loss=0.0626, train_accuracy=1.000, val_loss=0.253, val_accuracy=0.898]
Epoch 36:  91%|█████████ | 232/255 [01:21<00:08,  2.84it/s, loss=0.197, v_num=3, train_loss=0.0626, train_accuracy=1.000, val_loss=0.253, val_accuracy=0.898]
Epoch 36:  92%|█████████▏| 234/255 [01:21<00:07,  2.86it/s, loss=0.197, v_num=3, train_loss=0.0626, train_accuracy=1.000, val_loss=0.253, val_accuracy=0.898]
Epoch 36:  93%|█████████▎| 236/255 [01:22<00:06,  2.88it/s, loss=0.197, v_num=3, train_loss=0.0626, train_accuracy=1.000, 

Epoch 36, global step 8361: val_loss was not in top 2


Epoch 37:  89%|████████▊ | 226/255 [01:17<00:09,  2.90it/s, loss=0.213, v_num=3, train_loss=0.138, train_accuracy=0.944, val_loss=0.240, val_accuracy=0.898] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 37:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.213, v_num=3, train_loss=0.138, train_accuracy=0.944, val_loss=0.240, val_accuracy=0.898]
Epoch 37:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.213, v_num=3, train_loss=0.138, train_accuracy=0.944, val_loss=0.240, val_accuracy=0.898]
Epoch 37:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.213, v_num=3, train_loss=0.138, train_accuracy=0.944, val_loss=0.240, val_accuracy=0.898]
Epoch 37:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.213, v_num=3, train_loss=0.138, train_accuracy=0.944, val_loss=0.240, val_accuracy=0.898]
Epoch 37:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.213, v_num=3, train_loss=0.138, train_accuracy=0.944, val_l

Epoch 37, global step 8587: val_loss reached 0.21685 (best 0.21685), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v7.ckpt" as top 2


Epoch 38:  89%|████████▊ | 226/255 [01:17<00:09,  2.90it/s, loss=0.177, v_num=3, train_loss=0.0985, train_accuracy=1.000, val_loss=0.217, val_accuracy=0.906]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 38:  89%|████████▉ | 228/255 [01:21<00:09,  2.80it/s, loss=0.177, v_num=3, train_loss=0.0985, train_accuracy=1.000, val_loss=0.217, val_accuracy=0.906]
Epoch 38:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.177, v_num=3, train_loss=0.0985, train_accuracy=1.000, val_loss=0.217, val_accuracy=0.906]
Epoch 38:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.177, v_num=3, train_loss=0.0985, train_accuracy=1.000, val_loss=0.217, val_accuracy=0.906]
Epoch 38:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.177, v_num=3, train_loss=0.0985, train_accuracy=1.000, val_loss=0.217, val_accuracy=0.906]
Epoch 38:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.177, v_num=3, train_loss=0.0985, train_accuracy=1.000, 

Epoch 38, global step 8813: val_loss was not in top 2


Epoch 39:  89%|████████▊ | 226/255 [01:17<00:09,  2.90it/s, loss=0.168, v_num=3, train_loss=0.113, train_accuracy=0.944, val_loss=0.243, val_accuracy=0.904] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 39:  89%|████████▉ | 228/255 [01:21<00:09,  2.80it/s, loss=0.168, v_num=3, train_loss=0.113, train_accuracy=0.944, val_loss=0.243, val_accuracy=0.904]
Epoch 39:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.168, v_num=3, train_loss=0.113, train_accuracy=0.944, val_loss=0.243, val_accuracy=0.904]
Epoch 39:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.168, v_num=3, train_loss=0.113, train_accuracy=0.944, val_loss=0.243, val_accuracy=0.904]
Epoch 39:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.168, v_num=3, train_loss=0.113, train_accuracy=0.944, val_loss=0.243, val_accuracy=0.904]
Epoch 39:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.168, v_num=3, train_loss=0.113, train_accuracy=0.944, val_l

Epoch 39, global step 9039: val_loss was not in top 2


Epoch 40:  89%|████████▊ | 226/255 [01:17<00:09,  2.90it/s, loss=0.21, v_num=3, train_loss=0.286, train_accuracy=0.889, val_loss=0.265, val_accuracy=0.900]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 40:  89%|████████▉ | 228/255 [01:21<00:09,  2.80it/s, loss=0.21, v_num=3, train_loss=0.286, train_accuracy=0.889, val_loss=0.265, val_accuracy=0.900]
Epoch 40:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.21, v_num=3, train_loss=0.286, train_accuracy=0.889, val_loss=0.265, val_accuracy=0.900]
Epoch 40:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.21, v_num=3, train_loss=0.286, train_accuracy=0.889, val_loss=0.265, val_accuracy=0.900]
Epoch 40:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.21, v_num=3, train_loss=0.286, train_accuracy=0.889, val_loss=0.265, val_accuracy=0.900]
Epoch 40:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.21, v_num=3, train_loss=0.286, train_accuracy=0.889, val_loss=0

Epoch 40, global step 9265: val_loss was not in top 2


Epoch 41:  89%|████████▊ | 226/255 [01:17<00:09,  2.90it/s, loss=0.248, v_num=3, train_loss=0.422, train_accuracy=0.722, val_loss=0.233, val_accuracy=0.905] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 41:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.248, v_num=3, train_loss=0.422, train_accuracy=0.722, val_loss=0.233, val_accuracy=0.905]
Epoch 41:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.248, v_num=3, train_loss=0.422, train_accuracy=0.722, val_loss=0.233, val_accuracy=0.905]
Epoch 41:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.248, v_num=3, train_loss=0.422, train_accuracy=0.722, val_loss=0.233, val_accuracy=0.905]
Epoch 41:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.248, v_num=3, train_loss=0.422, train_accuracy=0.722, val_loss=0.233, val_accuracy=0.905]
Epoch 41:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.248, v_num=3, train_loss=0.422, train_accuracy=0.722, val_l

Epoch 41, global step 9491: val_loss was not in top 2


Epoch 42:  89%|████████▊ | 226/255 [01:17<00:09,  2.90it/s, loss=0.201, v_num=3, train_loss=0.0613, train_accuracy=0.944, val_loss=0.261, val_accuracy=0.881]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 42:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.201, v_num=3, train_loss=0.0613, train_accuracy=0.944, val_loss=0.261, val_accuracy=0.881]
Epoch 42:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.201, v_num=3, train_loss=0.0613, train_accuracy=0.944, val_loss=0.261, val_accuracy=0.881]
Epoch 42:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.201, v_num=3, train_loss=0.0613, train_accuracy=0.944, val_loss=0.261, val_accuracy=0.881]
Epoch 42:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.201, v_num=3, train_loss=0.0613, train_accuracy=0.944, val_loss=0.261, val_accuracy=0.881]
Epoch 42:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.201, v_num=3, train_loss=0.0613, train_accuracy=0.944, 

Epoch 42, global step 9717: val_loss was not in top 2


Epoch 43:  89%|████████▊ | 226/255 [01:17<00:10,  2.90it/s, loss=0.182, v_num=3, train_loss=0.157, train_accuracy=0.944, val_loss=0.243, val_accuracy=0.908] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 43:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.182, v_num=3, train_loss=0.157, train_accuracy=0.944, val_loss=0.243, val_accuracy=0.908]
Epoch 43:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.182, v_num=3, train_loss=0.157, train_accuracy=0.944, val_loss=0.243, val_accuracy=0.908]
Epoch 43:  91%|█████████ | 232/255 [01:22<00:08,  2.83it/s, loss=0.182, v_num=3, train_loss=0.157, train_accuracy=0.944, val_loss=0.243, val_accuracy=0.908]
Epoch 43:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.182, v_num=3, train_loss=0.157, train_accuracy=0.944, val_loss=0.243, val_accuracy=0.908]
Epoch 43:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.182, v_num=3, train_loss=0.157, train_accuracy=0.944, val_l

Epoch 43, global step 9943: val_loss reached 0.23095 (best 0.21685), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v6.ckpt" as top 2


Epoch 44:  89%|████████▊ | 226/255 [01:17<00:10,  2.90it/s, loss=0.169, v_num=3, train_loss=0.049, train_accuracy=1.000, val_loss=0.231, val_accuracy=0.903] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 44:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.169, v_num=3, train_loss=0.049, train_accuracy=1.000, val_loss=0.231, val_accuracy=0.903]
Epoch 44:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.169, v_num=3, train_loss=0.049, train_accuracy=1.000, val_loss=0.231, val_accuracy=0.903]
Epoch 44:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.169, v_num=3, train_loss=0.049, train_accuracy=1.000, val_loss=0.231, val_accuracy=0.903]
Epoch 44:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.169, v_num=3, train_loss=0.049, train_accuracy=1.000, val_loss=0.231, val_accuracy=0.903]
Epoch 44:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.169, v_num=3, train_loss=0.049, train_accuracy=1.000, val_l

Epoch 44, global step 10169: val_loss reached 0.21531 (best 0.21531), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v6.ckpt" as top 2


Epoch 45:  89%|████████▊ | 226/255 [01:17<00:10,  2.90it/s, loss=0.143, v_num=3, train_loss=0.182, train_accuracy=0.944, val_loss=0.215, val_accuracy=0.908] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 45:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.143, v_num=3, train_loss=0.182, train_accuracy=0.944, val_loss=0.215, val_accuracy=0.908]
Epoch 45:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.143, v_num=3, train_loss=0.182, train_accuracy=0.944, val_loss=0.215, val_accuracy=0.908]
Epoch 45:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.143, v_num=3, train_loss=0.182, train_accuracy=0.944, val_loss=0.215, val_accuracy=0.908]
Epoch 45:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.143, v_num=3, train_loss=0.182, train_accuracy=0.944, val_loss=0.215, val_accuracy=0.908]
Epoch 45:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.143, v_num=3, train_loss=0.182, train_accuracy=0.944, val_l

Epoch 45, global step 10395: val_loss was not in top 2


Epoch 46:  89%|████████▊ | 226/255 [01:17<00:09,  2.90it/s, loss=0.148, v_num=3, train_loss=0.112, train_accuracy=0.944, val_loss=0.226, val_accuracy=0.916] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 46:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.148, v_num=3, train_loss=0.112, train_accuracy=0.944, val_loss=0.226, val_accuracy=0.916]
Epoch 46:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.148, v_num=3, train_loss=0.112, train_accuracy=0.944, val_loss=0.226, val_accuracy=0.916]
Epoch 46:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.148, v_num=3, train_loss=0.112, train_accuracy=0.944, val_loss=0.226, val_accuracy=0.916]
Epoch 46:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.148, v_num=3, train_loss=0.112, train_accuracy=0.944, val_loss=0.226, val_accuracy=0.916]
Epoch 46:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.148, v_num=3, train_loss=0.112, train_accuracy=0.944, val_l

Epoch 46, global step 10621: val_loss reached 0.21358 (best 0.21358), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v7.ckpt" as top 2


Epoch 47:  89%|████████▊ | 226/255 [01:17<00:10,  2.90it/s, loss=0.167, v_num=3, train_loss=0.055, train_accuracy=1.000, val_loss=0.214, val_accuracy=0.917] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 47:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.167, v_num=3, train_loss=0.055, train_accuracy=1.000, val_loss=0.214, val_accuracy=0.917]
Epoch 47:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.167, v_num=3, train_loss=0.055, train_accuracy=1.000, val_loss=0.214, val_accuracy=0.917]
Epoch 47:  91%|█████████ | 232/255 [01:22<00:08,  2.83it/s, loss=0.167, v_num=3, train_loss=0.055, train_accuracy=1.000, val_loss=0.214, val_accuracy=0.917]
Epoch 47:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.167, v_num=3, train_loss=0.055, train_accuracy=1.000, val_loss=0.214, val_accuracy=0.917]
Epoch 47:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.167, v_num=3, train_loss=0.055, train_accuracy=1.000, val_l

Epoch 47, global step 10847: val_loss was not in top 2


Epoch 48:  89%|████████▊ | 226/255 [01:17<00:09,  2.90it/s, loss=0.187, v_num=3, train_loss=0.237, train_accuracy=0.889, val_loss=0.233, val_accuracy=0.911] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 48:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.187, v_num=3, train_loss=0.237, train_accuracy=0.889, val_loss=0.233, val_accuracy=0.911]
Epoch 48:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.187, v_num=3, train_loss=0.237, train_accuracy=0.889, val_loss=0.233, val_accuracy=0.911]
Epoch 48:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.187, v_num=3, train_loss=0.237, train_accuracy=0.889, val_loss=0.233, val_accuracy=0.911]
Epoch 48:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.187, v_num=3, train_loss=0.237, train_accuracy=0.889, val_loss=0.233, val_accuracy=0.911]
Epoch 48:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.187, v_num=3, train_loss=0.237, train_accuracy=0.889, val_l

Epoch 48, global step 11073: val_loss reached 0.21098 (best 0.21098), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v6.ckpt" as top 2


Epoch 49:  89%|████████▊ | 226/255 [01:17<00:09,  2.90it/s, loss=0.158, v_num=3, train_loss=0.344, train_accuracy=0.889, val_loss=0.211, val_accuracy=0.912] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 49:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.158, v_num=3, train_loss=0.344, train_accuracy=0.889, val_loss=0.211, val_accuracy=0.912]
Epoch 49:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.158, v_num=3, train_loss=0.344, train_accuracy=0.889, val_loss=0.211, val_accuracy=0.912]
Epoch 49:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.158, v_num=3, train_loss=0.344, train_accuracy=0.889, val_loss=0.211, val_accuracy=0.912]
Epoch 49:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.158, v_num=3, train_loss=0.344, train_accuracy=0.889, val_loss=0.211, val_accuracy=0.912]
Epoch 49:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.158, v_num=3, train_loss=0.344, train_accuracy=0.889, val_l

Epoch 49, global step 11299: val_loss reached 0.20939 (best 0.20939), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v7.ckpt" as top 2


Epoch 50:  89%|████████▊ | 226/255 [01:17<00:09,  2.90it/s, loss=0.144, v_num=3, train_loss=0.0461, train_accuracy=1.000, val_loss=0.209, val_accuracy=0.923]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 50:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.144, v_num=3, train_loss=0.0461, train_accuracy=1.000, val_loss=0.209, val_accuracy=0.923]
Epoch 50:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.144, v_num=3, train_loss=0.0461, train_accuracy=1.000, val_loss=0.209, val_accuracy=0.923]
Epoch 50:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.144, v_num=3, train_loss=0.0461, train_accuracy=1.000, val_loss=0.209, val_accuracy=0.923]
Epoch 50:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.144, v_num=3, train_loss=0.0461, train_accuracy=1.000, val_loss=0.209, val_accuracy=0.923]
Epoch 50:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.144, v_num=3, train_loss=0.0461, train_accuracy=1.000, 

Epoch 50, global step 11525: val_loss was not in top 2


Epoch 51:  89%|████████▊ | 226/255 [01:17<00:10,  2.90it/s, loss=0.136, v_num=3, train_loss=0.390, train_accuracy=0.778, val_loss=0.252, val_accuracy=0.908] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 51:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.136, v_num=3, train_loss=0.390, train_accuracy=0.778, val_loss=0.252, val_accuracy=0.908]
Epoch 51:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.136, v_num=3, train_loss=0.390, train_accuracy=0.778, val_loss=0.252, val_accuracy=0.908]
Epoch 51:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.136, v_num=3, train_loss=0.390, train_accuracy=0.778, val_loss=0.252, val_accuracy=0.908]
Epoch 51:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.136, v_num=3, train_loss=0.390, train_accuracy=0.778, val_loss=0.252, val_accuracy=0.908]
Epoch 51:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.136, v_num=3, train_loss=0.390, train_accuracy=0.778, val_l

Epoch 51, global step 11751: val_loss reached 0.20442 (best 0.20442), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v6.ckpt" as top 2


Epoch 52:  89%|████████▊ | 226/255 [01:17<00:10,  2.90it/s, loss=0.137, v_num=3, train_loss=0.246, train_accuracy=0.889, val_loss=0.204, val_accuracy=0.918] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 52:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.137, v_num=3, train_loss=0.246, train_accuracy=0.889, val_loss=0.204, val_accuracy=0.918]
Epoch 52:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.137, v_num=3, train_loss=0.246, train_accuracy=0.889, val_loss=0.204, val_accuracy=0.918]
Epoch 52:  91%|█████████ | 232/255 [01:22<00:08,  2.83it/s, loss=0.137, v_num=3, train_loss=0.246, train_accuracy=0.889, val_loss=0.204, val_accuracy=0.918]
Epoch 52:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.137, v_num=3, train_loss=0.246, train_accuracy=0.889, val_loss=0.204, val_accuracy=0.918]
Epoch 52:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.137, v_num=3, train_loss=0.246, train_accuracy=0.889, val_l

Epoch 52, global step 11977: val_loss was not in top 2


Epoch 53:  89%|████████▊ | 226/255 [01:17<00:10,  2.90it/s, loss=0.162, v_num=3, train_loss=0.157, train_accuracy=0.944, val_loss=0.221, val_accuracy=0.922] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 53:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.162, v_num=3, train_loss=0.157, train_accuracy=0.944, val_loss=0.221, val_accuracy=0.922]
Epoch 53:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.162, v_num=3, train_loss=0.157, train_accuracy=0.944, val_loss=0.221, val_accuracy=0.922]
Epoch 53:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.162, v_num=3, train_loss=0.157, train_accuracy=0.944, val_loss=0.221, val_accuracy=0.922]
Epoch 53:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.162, v_num=3, train_loss=0.157, train_accuracy=0.944, val_loss=0.221, val_accuracy=0.922]
Epoch 53:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.162, v_num=3, train_loss=0.157, train_accuracy=0.944, val_l

Epoch 53, global step 12203: val_loss reached 0.18717 (best 0.18717), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v7.ckpt" as top 2


Epoch 54:  89%|████████▊ | 226/255 [01:17<00:10,  2.90it/s, loss=0.29, v_num=3, train_loss=0.249, train_accuracy=0.944, val_loss=0.187, val_accuracy=0.926]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 54:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.29, v_num=3, train_loss=0.249, train_accuracy=0.944, val_loss=0.187, val_accuracy=0.926]
Epoch 54:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.29, v_num=3, train_loss=0.249, train_accuracy=0.944, val_loss=0.187, val_accuracy=0.926]
Epoch 54:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.29, v_num=3, train_loss=0.249, train_accuracy=0.944, val_loss=0.187, val_accuracy=0.926]
Epoch 54:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.29, v_num=3, train_loss=0.249, train_accuracy=0.944, val_loss=0.187, val_accuracy=0.926]
Epoch 54:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.29, v_num=3, train_loss=0.249, train_accuracy=0.944, val_loss=0

Epoch 54, global step 12429: val_loss was not in top 2


Epoch 55:  89%|████████▊ | 226/255 [01:17<00:09,  2.90it/s, loss=0.195, v_num=3, train_loss=0.218, train_accuracy=0.889, val_loss=0.317, val_accuracy=0.860]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 55:  89%|████████▉ | 228/255 [01:21<00:09,  2.80it/s, loss=0.195, v_num=3, train_loss=0.218, train_accuracy=0.889, val_loss=0.317, val_accuracy=0.860]
Epoch 55:  90%|█████████ | 230/255 [01:21<00:08,  2.82it/s, loss=0.195, v_num=3, train_loss=0.218, train_accuracy=0.889, val_loss=0.317, val_accuracy=0.860]
Epoch 55:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.195, v_num=3, train_loss=0.218, train_accuracy=0.889, val_loss=0.317, val_accuracy=0.860]
Epoch 55:  92%|█████████▏| 234/255 [01:21<00:07,  2.85it/s, loss=0.195, v_num=3, train_loss=0.218, train_accuracy=0.889, val_loss=0.317, val_accuracy=0.860]
Epoch 55:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.195, v_num=3, train_loss=0.218, train_accuracy=0.889, val_lo

Epoch 55, global step 12655: val_loss was not in top 2


Epoch 56:  89%|████████▊ | 226/255 [01:17<00:10,  2.90it/s, loss=0.178, v_num=3, train_loss=0.0437, train_accuracy=1.000, val_loss=0.230, val_accuracy=0.896]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 56:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.178, v_num=3, train_loss=0.0437, train_accuracy=1.000, val_loss=0.230, val_accuracy=0.896]
Epoch 56:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.178, v_num=3, train_loss=0.0437, train_accuracy=1.000, val_loss=0.230, val_accuracy=0.896]
Epoch 56:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.178, v_num=3, train_loss=0.0437, train_accuracy=1.000, val_loss=0.230, val_accuracy=0.896]
Epoch 56:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.178, v_num=3, train_loss=0.0437, train_accuracy=1.000, val_loss=0.230, val_accuracy=0.896]
Epoch 56:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.178, v_num=3, train_loss=0.0437, train_accuracy=1.000, 

Epoch 56, global step 12881: val_loss was not in top 2


Epoch 57:  89%|████████▊ | 226/255 [01:17<00:10,  2.90it/s, loss=0.142, v_num=3, train_loss=0.236, train_accuracy=0.944, val_loss=0.228, val_accuracy=0.910] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 57:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.142, v_num=3, train_loss=0.236, train_accuracy=0.944, val_loss=0.228, val_accuracy=0.910]
Epoch 57:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.142, v_num=3, train_loss=0.236, train_accuracy=0.944, val_loss=0.228, val_accuracy=0.910]
Epoch 57:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.142, v_num=3, train_loss=0.236, train_accuracy=0.944, val_loss=0.228, val_accuracy=0.910]
Epoch 57:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.142, v_num=3, train_loss=0.236, train_accuracy=0.944, val_loss=0.228, val_accuracy=0.910]
Epoch 57:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.142, v_num=3, train_loss=0.236, train_accuracy=0.944, val_l

Epoch 57, global step 13107: val_loss was not in top 2


Epoch 58:  89%|████████▊ | 226/255 [01:17<00:10,  2.90it/s, loss=0.109, v_num=3, train_loss=0.0669, train_accuracy=1.000, val_loss=0.210, val_accuracy=0.921]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 58:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.109, v_num=3, train_loss=0.0669, train_accuracy=1.000, val_loss=0.210, val_accuracy=0.921]
Epoch 58:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.109, v_num=3, train_loss=0.0669, train_accuracy=1.000, val_loss=0.210, val_accuracy=0.921]
Epoch 58:  91%|█████████ | 232/255 [01:22<00:08,  2.83it/s, loss=0.109, v_num=3, train_loss=0.0669, train_accuracy=1.000, val_loss=0.210, val_accuracy=0.921]
Epoch 58:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.109, v_num=3, train_loss=0.0669, train_accuracy=1.000, val_loss=0.210, val_accuracy=0.921]
Epoch 58:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.109, v_num=3, train_loss=0.0669, train_accuracy=1.000, 

Epoch 58, global step 13333: val_loss was not in top 2


Epoch 59:  89%|████████▊ | 226/255 [01:17<00:10,  2.90it/s, loss=0.154, v_num=3, train_loss=0.0233, train_accuracy=1.000, val_loss=0.206, val_accuracy=0.925]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 59:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.154, v_num=3, train_loss=0.0233, train_accuracy=1.000, val_loss=0.206, val_accuracy=0.925]
Epoch 59:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.154, v_num=3, train_loss=0.0233, train_accuracy=1.000, val_loss=0.206, val_accuracy=0.925]
Epoch 59:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.154, v_num=3, train_loss=0.0233, train_accuracy=1.000, val_loss=0.206, val_accuracy=0.925]
Epoch 59:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.154, v_num=3, train_loss=0.0233, train_accuracy=1.000, val_loss=0.206, val_accuracy=0.925]
Epoch 59:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.154, v_num=3, train_loss=0.0233, train_accuracy=1.000, 

Epoch 59, global step 13559: val_loss reached 0.19847 (best 0.18717), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v6.ckpt" as top 2


Epoch 60:  89%|████████▊ | 226/255 [01:17<00:10,  2.90it/s, loss=0.322, v_num=3, train_loss=0.363, train_accuracy=0.722, val_loss=0.198, val_accuracy=0.916] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 60:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.322, v_num=3, train_loss=0.363, train_accuracy=0.722, val_loss=0.198, val_accuracy=0.916]
Epoch 60:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.322, v_num=3, train_loss=0.363, train_accuracy=0.722, val_loss=0.198, val_accuracy=0.916]
Epoch 60:  91%|█████████ | 232/255 [01:22<00:08,  2.83it/s, loss=0.322, v_num=3, train_loss=0.363, train_accuracy=0.722, val_loss=0.198, val_accuracy=0.916]
Epoch 60:  92%|█████████▏| 234/255 [01:22<00:07,  2.84it/s, loss=0.322, v_num=3, train_loss=0.363, train_accuracy=0.722, val_loss=0.198, val_accuracy=0.916]
Epoch 60:  93%|█████████▎| 236/255 [01:22<00:06,  2.86it/s, loss=0.322, v_num=3, train_loss=0.363, train_accuracy=0.722, val_l

Epoch 60, global step 13785: val_loss was not in top 2


Epoch 61:  89%|████████▊ | 226/255 [01:17<00:09,  2.90it/s, loss=0.162, v_num=3, train_loss=0.165, train_accuracy=0.944, val_loss=0.254, val_accuracy=0.889] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 61:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.162, v_num=3, train_loss=0.165, train_accuracy=0.944, val_loss=0.254, val_accuracy=0.889]
Epoch 61:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.162, v_num=3, train_loss=0.165, train_accuracy=0.944, val_loss=0.254, val_accuracy=0.889]
Epoch 61:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.162, v_num=3, train_loss=0.165, train_accuracy=0.944, val_loss=0.254, val_accuracy=0.889]
Epoch 61:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.162, v_num=3, train_loss=0.165, train_accuracy=0.944, val_loss=0.254, val_accuracy=0.889]
Epoch 61:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.162, v_num=3, train_loss=0.165, train_accuracy=0.944, val_l

Epoch 61, global step 14011: val_loss reached 0.19291 (best 0.18717), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v6.ckpt" as top 2


Epoch 62:  89%|████████▊ | 226/255 [01:17<00:09,  2.90it/s, loss=0.162, v_num=3, train_loss=0.234, train_accuracy=0.833, val_loss=0.193, val_accuracy=0.923] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 62:  89%|████████▉ | 228/255 [01:21<00:09,  2.80it/s, loss=0.162, v_num=3, train_loss=0.234, train_accuracy=0.833, val_loss=0.193, val_accuracy=0.923]
Epoch 62:  90%|█████████ | 230/255 [01:21<00:08,  2.82it/s, loss=0.162, v_num=3, train_loss=0.234, train_accuracy=0.833, val_loss=0.193, val_accuracy=0.923]
Epoch 62:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.162, v_num=3, train_loss=0.234, train_accuracy=0.833, val_loss=0.193, val_accuracy=0.923]
Epoch 62:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.162, v_num=3, train_loss=0.234, train_accuracy=0.833, val_loss=0.193, val_accuracy=0.923]
Epoch 62:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.162, v_num=3, train_loss=0.234, train_accuracy=0.833, val_l

Epoch 62, global step 14237: val_loss reached 0.18279 (best 0.18279), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v6.ckpt" as top 2


Epoch 63:  89%|████████▊ | 226/255 [01:17<00:10,  2.90it/s, loss=0.182, v_num=3, train_loss=0.343, train_accuracy=0.889, val_loss=0.183, val_accuracy=0.929] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 63:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.182, v_num=3, train_loss=0.343, train_accuracy=0.889, val_loss=0.183, val_accuracy=0.929]
Epoch 63:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.182, v_num=3, train_loss=0.343, train_accuracy=0.889, val_loss=0.183, val_accuracy=0.929]
Epoch 63:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.182, v_num=3, train_loss=0.343, train_accuracy=0.889, val_loss=0.183, val_accuracy=0.929]
Epoch 63:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.182, v_num=3, train_loss=0.343, train_accuracy=0.889, val_loss=0.183, val_accuracy=0.929]
Epoch 63:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.182, v_num=3, train_loss=0.343, train_accuracy=0.889, val_l

Epoch 63, global step 14463: val_loss was not in top 2


Epoch 64:  89%|████████▊ | 226/255 [01:18<00:10,  2.90it/s, loss=0.139, v_num=3, train_loss=0.130, train_accuracy=0.944, val_loss=0.216, val_accuracy=0.921] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 64:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.139, v_num=3, train_loss=0.130, train_accuracy=0.944, val_loss=0.216, val_accuracy=0.921]
Epoch 64:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.139, v_num=3, train_loss=0.130, train_accuracy=0.944, val_loss=0.216, val_accuracy=0.921]
Epoch 64:  91%|█████████ | 232/255 [01:22<00:08,  2.83it/s, loss=0.139, v_num=3, train_loss=0.130, train_accuracy=0.944, val_loss=0.216, val_accuracy=0.921]
Epoch 64:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.139, v_num=3, train_loss=0.130, train_accuracy=0.944, val_loss=0.216, val_accuracy=0.921]
Epoch 64:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.139, v_num=3, train_loss=0.130, train_accuracy=0.944, val_l

Epoch 64, global step 14689: val_loss was not in top 2


Epoch 65:  89%|████████▊ | 226/255 [01:18<00:10,  2.89it/s, loss=0.137, v_num=3, train_loss=0.0275, train_accuracy=1.000, val_loss=0.196, val_accuracy=0.917] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 65:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.137, v_num=3, train_loss=0.0275, train_accuracy=1.000, val_loss=0.196, val_accuracy=0.917]
Epoch 65:  90%|█████████ | 230/255 [01:21<00:08,  2.80it/s, loss=0.137, v_num=3, train_loss=0.0275, train_accuracy=1.000, val_loss=0.196, val_accuracy=0.917]
Epoch 65:  91%|█████████ | 232/255 [01:22<00:08,  2.82it/s, loss=0.137, v_num=3, train_loss=0.0275, train_accuracy=1.000, val_loss=0.196, val_accuracy=0.917]
Epoch 65:  92%|█████████▏| 234/255 [01:22<00:07,  2.84it/s, loss=0.137, v_num=3, train_loss=0.0275, train_accuracy=1.000, val_loss=0.196, val_accuracy=0.917]
Epoch 65:  93%|█████████▎| 236/255 [01:22<00:06,  2.86it/s, loss=0.137, v_num=3, train_loss=0.0275, train_accuracy=1.000,

Epoch 65, global step 14915: val_loss was not in top 2


Epoch 66:  89%|████████▊ | 226/255 [01:17<00:10,  2.90it/s, loss=0.146, v_num=3, train_loss=0.134, train_accuracy=0.833, val_loss=0.200, val_accuracy=0.925] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 66:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.146, v_num=3, train_loss=0.134, train_accuracy=0.833, val_loss=0.200, val_accuracy=0.925]
Epoch 66:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.146, v_num=3, train_loss=0.134, train_accuracy=0.833, val_loss=0.200, val_accuracy=0.925]
Epoch 66:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.146, v_num=3, train_loss=0.134, train_accuracy=0.833, val_loss=0.200, val_accuracy=0.925]
Epoch 66:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.146, v_num=3, train_loss=0.134, train_accuracy=0.833, val_loss=0.200, val_accuracy=0.925]
Epoch 66:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.146, v_num=3, train_loss=0.134, train_accuracy=0.833, val_l

Epoch 66, global step 15141: val_loss reached 0.18342 (best 0.18279), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v7.ckpt" as top 2


Epoch 67:  89%|████████▊ | 226/255 [01:18<00:10,  2.89it/s, loss=0.135, v_num=3, train_loss=0.431, train_accuracy=0.778, val_loss=0.183, val_accuracy=0.923] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 67:  89%|████████▉ | 228/255 [01:21<00:09,  2.78it/s, loss=0.135, v_num=3, train_loss=0.431, train_accuracy=0.778, val_loss=0.183, val_accuracy=0.923]
Epoch 67:  90%|█████████ | 230/255 [01:22<00:08,  2.80it/s, loss=0.135, v_num=3, train_loss=0.431, train_accuracy=0.778, val_loss=0.183, val_accuracy=0.923]
Epoch 67:  91%|█████████ | 232/255 [01:22<00:08,  2.82it/s, loss=0.135, v_num=3, train_loss=0.431, train_accuracy=0.778, val_loss=0.183, val_accuracy=0.923]
Epoch 67:  92%|█████████▏| 234/255 [01:22<00:07,  2.84it/s, loss=0.135, v_num=3, train_loss=0.431, train_accuracy=0.778, val_loss=0.183, val_accuracy=0.923]
Epoch 67:  93%|█████████▎| 236/255 [01:22<00:06,  2.86it/s, loss=0.135, v_num=3, train_loss=0.431, train_accuracy=0.778, val_l

Epoch 67, global step 15367: val_loss reached 0.18049 (best 0.18049), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v7.ckpt" as top 2


Epoch 68:  89%|████████▊ | 226/255 [01:17<00:10,  2.90it/s, loss=0.118, v_num=3, train_loss=0.188, train_accuracy=0.889, val_loss=0.180, val_accuracy=0.925]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 68:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.118, v_num=3, train_loss=0.188, train_accuracy=0.889, val_loss=0.180, val_accuracy=0.925]
Epoch 68:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.118, v_num=3, train_loss=0.188, train_accuracy=0.889, val_loss=0.180, val_accuracy=0.925]
Epoch 68:  91%|█████████ | 232/255 [01:21<00:08,  2.83it/s, loss=0.118, v_num=3, train_loss=0.188, train_accuracy=0.889, val_loss=0.180, val_accuracy=0.925]
Epoch 68:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.118, v_num=3, train_loss=0.188, train_accuracy=0.889, val_loss=0.180, val_accuracy=0.925]
Epoch 68:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.118, v_num=3, train_loss=0.188, train_accuracy=0.889, val_

Epoch 68, global step 15593: val_loss reached 0.17997 (best 0.17997), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v6.ckpt" as top 2


Epoch 69:  89%|████████▊ | 226/255 [01:18<00:10,  2.90it/s, loss=0.13, v_num=3, train_loss=0.133, train_accuracy=0.944, val_loss=0.180, val_accuracy=0.925]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 69:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.13, v_num=3, train_loss=0.133, train_accuracy=0.944, val_loss=0.180, val_accuracy=0.925]
Epoch 69:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.13, v_num=3, train_loss=0.133, train_accuracy=0.944, val_loss=0.180, val_accuracy=0.925]
Epoch 69:  91%|█████████ | 232/255 [01:22<00:08,  2.83it/s, loss=0.13, v_num=3, train_loss=0.133, train_accuracy=0.944, val_loss=0.180, val_accuracy=0.925]
Epoch 69:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.13, v_num=3, train_loss=0.133, train_accuracy=0.944, val_loss=0.180, val_accuracy=0.925]
Epoch 69:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.13, v_num=3, train_loss=0.133, train_accuracy=0.944, val_loss=0

Epoch 69, global step 15819: val_loss reached 0.16945 (best 0.16945), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v7.ckpt" as top 2


Epoch 70:  89%|████████▊ | 226/255 [01:18<00:10,  2.90it/s, loss=0.0987, v_num=3, train_loss=0.143, train_accuracy=0.944, val_loss=0.169, val_accuracy=0.928] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 70:  89%|████████▉ | 228/255 [01:21<00:09,  2.79it/s, loss=0.0987, v_num=3, train_loss=0.143, train_accuracy=0.944, val_loss=0.169, val_accuracy=0.928]
Epoch 70:  90%|█████████ | 230/255 [01:21<00:08,  2.81it/s, loss=0.0987, v_num=3, train_loss=0.143, train_accuracy=0.944, val_loss=0.169, val_accuracy=0.928]
Epoch 70:  91%|█████████ | 232/255 [01:22<00:08,  2.83it/s, loss=0.0987, v_num=3, train_loss=0.143, train_accuracy=0.944, val_loss=0.169, val_accuracy=0.928]
Epoch 70:  92%|█████████▏| 234/255 [01:22<00:07,  2.85it/s, loss=0.0987, v_num=3, train_loss=0.143, train_accuracy=0.944, val_loss=0.169, val_accuracy=0.928]
Epoch 70:  93%|█████████▎| 236/255 [01:22<00:06,  2.87it/s, loss=0.0987, v_num=3, train_loss=0.143, train_accuracy=0.944,

Epoch 70, global step 16045: val_loss reached 0.16260 (best 0.16260), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-18-v6.ckpt" as top 2


Epoch 71:  89%|████████▊ | 226/255 [01:17<00:09,  2.92it/s, loss=0.127, v_num=3, train_loss=0.251, train_accuracy=0.889, val_loss=0.163, val_accuracy=0.928]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 71:  89%|████████▉ | 228/255 [01:21<00:09,  2.81it/s, loss=0.127, v_num=3, train_loss=0.251, train_accuracy=0.889, val_loss=0.163, val_accuracy=0.928]
Epoch 71:  90%|█████████ | 230/255 [01:21<00:08,  2.83it/s, loss=0.127, v_num=3, train_loss=0.251, train_accuracy=0.889, val_loss=0.163, val_accuracy=0.928]
Epoch 71:  91%|█████████ | 232/255 [01:21<00:08,  2.85it/s, loss=0.127, v_num=3, train_loss=0.251, train_accuracy=0.889, val_loss=0.163, val_accuracy=0.928]
Epoch 71:  92%|█████████▏| 234/255 [01:21<00:07,  2.87it/s, loss=0.127, v_num=3, train_loss=0.251, train_accuracy=0.889, val_loss=0.163, val_accuracy=0.928]
Epoch 71:  93%|█████████▎| 236/255 [01:21<00:06,  2.89it/s, loss=0.127, v_num=3, train_loss=0.251, train_accuracy=0.889, val

Epoch 71, global step 16271: val_loss was not in top 2


Epoch 72:  89%|████████▊ | 226/255 [01:17<00:09,  2.91it/s, loss=0.178, v_num=3, train_loss=0.295, train_accuracy=0.889, val_loss=0.170, val_accuracy=0.932]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 72:  89%|████████▉ | 228/255 [01:21<00:09,  2.80it/s, loss=0.178, v_num=3, train_loss=0.295, train_accuracy=0.889, val_loss=0.170, val_accuracy=0.932]
Epoch 72:  90%|█████████ | 230/255 [01:21<00:08,  2.82it/s, loss=0.178, v_num=3, train_loss=0.295, train_accuracy=0.889, val_loss=0.170, val_accuracy=0.932]
Epoch 72:  91%|█████████ | 232/255 [01:21<00:08,  2.84it/s, loss=0.178, v_num=3, train_loss=0.295, train_accuracy=0.889, val_loss=0.170, val_accuracy=0.932]
Epoch 72:  92%|█████████▏| 234/255 [01:21<00:07,  2.86it/s, loss=0.178, v_num=3, train_loss=0.295, train_accuracy=0.889, val_loss=0.170, val_accuracy=0.932]
Epoch 72:  93%|█████████▎| 236/255 [01:22<00:06,  2.88it/s, loss=0.178, v_num=3, train_loss=0.295, train_accuracy=0.889, val_

Epoch 72, global step 16497: val_loss was not in top 2


Epoch 73:  89%|████████▊ | 226/255 [01:18<00:10,  2.89it/s, loss=0.0872, v_num=3, train_loss=0.0395, train_accuracy=1.000, val_loss=0.266, val_accuracy=0.900]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 73:  89%|████████▉ | 228/255 [01:22<00:09,  2.78it/s, loss=0.0872, v_num=3, train_loss=0.0395, train_accuracy=1.000, val_loss=0.266, val_accuracy=0.900]
Epoch 73:  90%|█████████ | 230/255 [01:22<00:08,  2.80it/s, loss=0.0872, v_num=3, train_loss=0.0395, train_accuracy=1.000, val_loss=0.266, val_accuracy=0.900]
Epoch 73:  91%|█████████ | 232/255 [01:22<00:08,  2.82it/s, loss=0.0872, v_num=3, train_loss=0.0395, train_accuracy=1.000, val_loss=0.266, val_accuracy=0.900]
Epoch 73:  92%|█████████▏| 234/255 [01:22<00:07,  2.84it/s, loss=0.0872, v_num=3, train_loss=0.0395, train_accuracy=1.000, val_loss=0.266, val_accuracy=0.900]
Epoch 73:  93%|█████████▎| 236/255 [01:22<00:06,  2.85it/s, loss=0.0872, v_num=3, train_loss=0.0395, train_accuracy=1

Epoch 73, global step 16723: val_loss was not in top 2


Epoch 74:  89%|████████▊ | 226/255 [01:18<00:10,  2.88it/s, loss=0.11, v_num=3, train_loss=0.105, train_accuracy=0.944, val_loss=0.184, val_accuracy=0.934]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 74:  89%|████████▉ | 228/255 [01:22<00:09,  2.78it/s, loss=0.11, v_num=3, train_loss=0.105, train_accuracy=0.944, val_loss=0.184, val_accuracy=0.934]
Epoch 74:  90%|█████████ | 230/255 [01:22<00:08,  2.80it/s, loss=0.11, v_num=3, train_loss=0.105, train_accuracy=0.944, val_loss=0.184, val_accuracy=0.934]
Epoch 74:  91%|█████████ | 232/255 [01:22<00:08,  2.81it/s, loss=0.11, v_num=3, train_loss=0.105, train_accuracy=0.944, val_loss=0.184, val_accuracy=0.934]
Epoch 74:  92%|█████████▏| 234/255 [01:22<00:07,  2.83it/s, loss=0.11, v_num=3, train_loss=0.105, train_accuracy=0.944, val_loss=0.184, val_accuracy=0.934]
Epoch 74:  93%|█████████▎| 236/255 [01:22<00:06,  2.85it/s, loss=0.11, v_num=3, train_loss=0.105, train_accuracy=0.944, val_loss=

Epoch 74, global step 16949: val_loss was not in top 2


Epoch 75:  89%|████████▊ | 226/255 [01:18<00:10,  2.89it/s, loss=0.0901, v_num=3, train_loss=0.0212, train_accuracy=1.000, val_loss=0.186, val_accuracy=0.938]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 75:  89%|████████▉ | 228/255 [01:22<00:09,  2.78it/s, loss=0.0901, v_num=3, train_loss=0.0212, train_accuracy=1.000, val_loss=0.186, val_accuracy=0.938]
Epoch 75:  90%|█████████ | 230/255 [01:22<00:08,  2.80it/s, loss=0.0901, v_num=3, train_loss=0.0212, train_accuracy=1.000, val_loss=0.186, val_accuracy=0.938]
Epoch 75:  91%|█████████ | 232/255 [01:22<00:08,  2.82it/s, loss=0.0901, v_num=3, train_loss=0.0212, train_accuracy=1.000, val_loss=0.186, val_accuracy=0.938]
Epoch 75:  92%|█████████▏| 234/255 [01:22<00:07,  2.84it/s, loss=0.0901, v_num=3, train_loss=0.0212, train_accuracy=1.000, val_loss=0.186, val_accuracy=0.938]
Epoch 75:  93%|█████████▎| 236/255 [01:22<00:06,  2.85it/s, loss=0.0901, v_num=3, train_loss=0.0212, train_accuracy=1

Epoch 75, global step 17175: val_loss was not in top 2


Epoch 76:  54%|█████▎    | 137/255 [01:34<01:21,  1.45it/s, loss=0.145, v_num=3, train_loss=0.490, train_accuracy=0.860, val_loss=0.181, val_accuracy=0.933]  

## Load Checkpoint 

In [None]:
# best-checkpoint-corr-3-v1.ckptn
# trainer.fit(model, data_module, ckpt_path="/Workspace/code/checkpoints/best-checkpoint-corr-3-v1.ckpt")