In [1]:
import os
import pandas as pd
import numpy as np
from sklearn.preprocessing import LabelEncoder
from sklearn.model_selection import train_test_split
from sklearn.metrics import classification_report, confusion_matrix
import matplotlib.pyplot as plt

import torch
from torch import nn, optim
from torch.nn import functional as F
from torch.utils.data import Dataset, DataLoader

import torchmetrics
from torchmetrics.functional import accuracy, f1_score

import pytorch_lightning as pl
from pytorch_lightning.loggers import TensorBoardLogger
from pytorch_lightning.callbacks import ModelCheckpoint

device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
print(device)

  from .autonotebook import tqdm as notebook_tqdm


cuda


## Model Setup 

In [13]:
pl.seed_everything(42, workers=True)

class DrowsyDataset(Dataset):
    
    def __init__(self, sequences):
        self.sequences = sequences
        
    def __len__(self):
        return len(self.sequences)
    
    def __getitem__(self, idx):
        sequence, label = self.sequences[idx]
        return dict(
            sequence=torch.Tensor(sequence.to_numpy()),
            label=torch.tensor(label).long()
        )
    
class DrowsyDataModule(pl.LightningDataModule):
    
    def __init__(self, train_sequences, val_sequences, test_sequences, batch_size):
        super().__init__()
        self.train_sequences = train_sequences
        self.val_sequences = val_sequences
        self.test_sequences = test_sequences
        self.batch_size = batch_size

    def setup(self, stage=None):
        self.train_dataset = DrowsyDataset(self.train_sequences)
        self.val_dataset = DrowsyDataset(self.val_sequences)
        self.test_dataset = DrowsyDataset(self.test_sequences)
        
    def train_dataloader(self):
        return DataLoader(
            self.train_dataset,
            batch_size=self.batch_size,
            shuffle=True,
            num_workers=os.cpu_count()
        )
    
    def val_dataloader(self):
        return DataLoader(
            self.val_dataset,
            batch_size=self.batch_size,
            shuffle=False,
            num_workers=os.cpu_count()
        )
    
    def test_dataloader(self):
        return DataLoader(
            self.test_dataset,
            batch_size=self.batch_size,
            shuffle=False,
            num_workers=os.cpu_count()
        ) 

class DrowsyModel(nn.Module):
    
    def __init__(self, n_features, n_classes, n_hidden=256, n_layers=3):
        super().__init__()
        
        self.n_hidden = n_hidden
        
        self.lstm = nn.LSTM(
            input_size=n_features,
            hidden_size=n_hidden,
            num_layers=n_layers,
            batch_first=True,
            dropout=0.75
        )
        
        self.classifier = nn.Linear(n_hidden, n_classes)
        
    def forward(self, x):
        self.lstm.flatten_parameters()
        _, (hidden, _) = self.lstm(x)
        
        out = hidden[-1]
        return self.classifier(out)
    
class DrowsyPredictor(pl.LightningModule):
    
    def __init__(self, n_features: int, n_classes: int):
        super().__init__()
        self.model = DrowsyModel(n_features, n_classes)
        self.criterion = nn.CrossEntropyLoss()
        
    def forward(self, x, label=None):
        output = self.model(x)
        loss = 0
        if label is not None:
            loss = self.criterion(output, label)
        return loss, output
        
    def training_step(self, batch, batch_idx):
        sequences = batch["sequence"]
        labels = batch["label"]
        loss, outputs = self(sequences, labels)
        predictions = torch.argmax(outputs, dim=1)
        step_accuracy = accuracy(predictions, labels)
        my_f1_score = f1_score(predictions, labels)
        
        self.log("train_loss", loss, prog_bar=True, logger=True)
        self.log("train_accuracy", step_accuracy, prog_bar=True, logger=True)
        self.log("train_f1_score", my_f1_score, prog_bar=True, logger=True)
        
        return {"loss": loss, "accuracy": step_accuracy}
    
    def validation_step(self, batch, batch_idx):
        sequences = batch["sequence"]
        labels = batch["label"]
        loss, outputs = self(sequences, labels)
        predictions = torch.argmax(outputs, dim=1)
        step_accuracy = accuracy(predictions, labels)
        my_f1_score = f1_score(predictions, labels)
        
        self.log("val_loss", loss, prog_bar=True, logger=True)
        self.log("val_accuracy", step_accuracy, prog_bar=True, logger=True)
        self.log("val_f1_score", my_f1_score, prog_bar=True, logger=True)
        
        return {"loss": loss, "accuracy": step_accuracy}
    
    def test_step(self, batch, batch_idx):
        sequences = batch["sequence"]
        labels = batch["label"]
        loss, outputs = self(sequences, labels)
        predictions = torch.argmax(outputs, dim=1)
        step_accuracy = accuracy(predictions, labels)
        my_f1_score = f1_score(predictions, labels)
        
        self.log("test_loss", loss, prog_bar=True, logger=True)
        self.log("test_accuracy", step_accuracy, prog_bar=True, logger=True)
        self.log("test_f1_score", my_f1_score, prog_bar=True, logger=True)
        
        return {"loss": loss, "accuracy": step_accuracy}
    
    def configure_optimizers(self):
        return optim.Adam(self.parameters(), lr=0.0001)

Global seed set to 42


## 參數設置

In [3]:
%load_ext tensorboard
%reload_ext tensorboard
%tensorboard --logdir ./lightning_logs --host 0.0.0.0 --port=8888

Reusing TensorBoard on port 8888 (pid 7376), started 0:00:03 ago. (Use '!kill 7376' to kill it.)

In [4]:
X_train = pd.read_csv('../data2.csv')

In [8]:
N_EPOCHS = 200
BATCH_SIZE = 50

# randomed 
# ORG_FEATURE_COLUMNS = ['HEOR', 'T5', 'VEOL', 'VEOU', 'F8', 'FZ', 'F7', 'TP8', 'FC3', 'T4', 'HEOL', 'FT10', 'O2', 'FC4', 'FCZ', 'CP3', 'FP2', 'TP7', 'C3', 'F3', 'PZ', 'F4', 'O1', 'FT7', 'CP4', 'FP1', 'C4', 'T6', 'FT8', 'CZ', 'PO1', 'OZ', 'A2', 'A1', 'T3', 'P4', 'P3', 'FT9', 'CPZ', 'PO2']
ORG_FEATURE_COLUMNS = ['HEOR', 'T5', 'VEOL', 'VEOU', 'F8', 'FZ', 'F7', 'TP8', 'FC3', 'T4', 'HEOL', 'FT10', 'O2', 'FC4', 'FCZ', 'CP3', 'FP2', 'TP7', 'C3', 'F3', 'PZ', 'F4', 'O1', 'FT7', 'CP4', 'FP1', 'C4', 'T6', 'FT8', 'CZ', 'PO1', 'OZ', 'A2', 'A1', 'T3', 'P4', 'P3', 'FT9', 'CPZ', 'PO2']
g = X_train.groupby("group")

# For 口試補充：
# ORG_FEATURE_COLUMNS = ['FP1','FP2','FZ']


In [6]:
# import random
# ORG_FEATURE_COLUMNS = ['TP8', 'FP2', 'FCZ', 'FT10', 'O2', 'O1', 'FT7', 'F4', 'TP7', 'C3', 'C4', 'F3', 'FT8', 'T6', 'HEOR', 'T5', 'VEOL', 'F7', 'FZ', 'VEOU', 'A1', 'P3', 'PZ', 'CP3', 'P4', 'CPZ', 'A2', 'HEOL', 'CP4', 'FT9', 'F8', 'OZ', 'CZ', 'FC4', 'FC3', 'FP1', 'PO1', 'T3', 'T4', 'PO2']
# random.shuffle(ORG_FEATURE_COLUMNS)
# print(ORG_FEATURE_COLUMNS)

## Main

In [15]:
n = 0
FEATURE_COLUMNS = ORG_FEATURE_COLUMNS[n:]

while(n < 40):
    print("------------------ Round: " + str(n) + " ------------------")
    print(FEATURE_COLUMNS)
    print("Len:", len(FEATURE_COLUMNS))
    
    label_encoder = LabelEncoder()
    encoded_labels = label_encoder.fit_transform(X_train.state)

    label_encoder.classes_

    X_train['label'] = encoded_labels

    # Prepare data ###########################################
    sequences = [] 

    for name, group in g:
        sequence_features = group[FEATURE_COLUMNS]
        label = group.label.iloc[0]

        # print((sequence_features, label))
        sequences.append((sequence_features, label))

    # Setting up train, test, val gruop #######################
    train_sequences, test_sequences = train_test_split(sequences, test_size=0.2)
    val_sequences, test_sequences = train_test_split(test_sequences, test_size=0.5)


    # Setting up data module ##################################
    data_module = DrowsyDataModule(
        train_sequences, val_sequences, test_sequences, BATCH_SIZE
    )

    model = DrowsyPredictor(
        n_features=len(FEATURE_COLUMNS), 
        n_classes=len(label_encoder.classes_)
    )

    # Check points and logger #################################
    checkpoint_callback = ModelCheckpoint(
        dirpath="checkpoints",
        filename="best-checkpoint-corr-mi-" + str(n),
        save_top_k=2,
        verbose=True,
        monitor="val_loss",
        mode="min"
    )

    logger = TensorBoardLogger("lightning_logs", name="Drowsy_MI" + str(n))

    trainer = pl.Trainer(
        logger=logger,
        callbacks=[checkpoint_callback],
        max_epochs=N_EPOCHS,
        gpus=[2],
#         gpus=1, 
#         auto_select_gpus=True,
        auto_lr_find=True, 
        # check_val_every_n_epoch=10
        # refresh_rate=20,
    )
    
    # Training start
    if (n == 44):
        trainer.fit(model, data_module, ckpt_path="/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v3.ckpt")
    else:
        trainer.fit(model, data_module)
    trainer.test(model, data_module)
    
    FEATURE_COLUMNS.pop(0)
    n = n + 1

------------------ Round: 0 ------------------
['HEOR', 'T5', 'VEOL', 'VEOU', 'F8', 'FZ', 'F7', 'TP8', 'FC3', 'T4', 'HEOL', 'FT10', 'O2', 'FC4', 'FCZ', 'CP3', 'FP2', 'TP7', 'C3', 'F3', 'PZ', 'F4', 'O1', 'FT7', 'CP4', 'FP1', 'C4', 'T6', 'FT8', 'CZ', 'PO1', 'OZ', 'A2', 'A1', 'T3', 'P4', 'P3', 'FT9', 'CPZ', 'PO2']
Len: 40


GPU available: True, used: True
TPU available: False, using: 0 TPU cores
IPU available: False, using: 0 IPUs
LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1,2]

  | Name      | Type             | Params
-----------------------------------------------
0 | model     | DrowsyModel      | 1.4 M 
1 | criterion | CrossEntropyLoss | 0     
-----------------------------------------------
1.4 M     Trainable params
0         Non-trainable params
1.4 M     Total params
5.433     Total estimated model params size (MB)
  rank_zero_warn(f"Checkpoint directory {dirpath} exists and is not empty.")


                                                                      

Global seed set to 42


Epoch 0:  89%|████████▊ | 226/255 [01:19<00:10,  2.84it/s, loss=0.621, v_num=4, train_loss=0.580, train_accuracy=0.778, train_f1_score=0.778]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 0:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.621, v_num=4, train_loss=0.580, train_accuracy=0.778, train_f1_score=0.778]
Epoch 0:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.621, v_num=4, train_loss=0.580, train_accuracy=0.778, train_f1_score=0.778]
Epoch 0:  91%|█████████ | 232/255 [01:26<00:08,  2.67it/s, loss=0.621, v_num=4, train_loss=0.580, train_accuracy=0.778, train_f1_score=0.778]
Epoch 0:  92%|█████████▏| 234/255 [01:27<00:07,  2.69it/s, loss=0.621, v_num=4, train_loss=0.580, train_accuracy=0.778, train_f1_score=0.778]
Epoch 0:  93%|█████████▎| 236/255 [01:27<00:07,  2.71it/s, loss=0.621, v_num=4, train_loss=0.580, train_accuracy=0.778, train_f1_score=0.778]
Epoch 0:  93%|█████████▎| 238/255 [01:27<00:06,  2.72it/s, l

Epoch 0, global step 225: val_loss reached 0.64842 (best 0.64842), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v2.ckpt" as top 2


Epoch 1:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.543, v_num=4, train_loss=0.666, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.648, val_accuracy=0.622, val_f1_score=0.622]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 1:  89%|████████▉ | 228/255 [01:27<00:10,  2.59it/s, loss=0.543, v_num=4, train_loss=0.666, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.648, val_accuracy=0.622, val_f1_score=0.622]
Epoch 1:  90%|█████████ | 230/255 [01:28<00:09,  2.61it/s, loss=0.543, v_num=4, train_loss=0.666, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.648, val_accuracy=0.622, val_f1_score=0.622]
Epoch 1:  91%|█████████ | 232/255 [01:28<00:08,  2.63it/s, loss=0.543, v_num=4, train_loss=0.666, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.648, val_accuracy=0.622, val_f1_score=0.622]
Epoch 1:  92%|█████████▏| 234/255 [01:28<00:07,  2.65it/s, loss=0.543, v_num=4, train_loss=0.666, train_accuracy=0.667, 

Epoch 1, global step 451: val_loss reached 0.65124 (best 0.64842), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v3.ckpt" as top 2


Epoch 2:  89%|████████▊ | 226/255 [01:21<00:10,  2.78it/s, loss=0.662, v_num=4, train_loss=0.591, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.651, val_accuracy=0.671, val_f1_score=0.671]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 2:  89%|████████▉ | 228/255 [01:28<00:10,  2.56it/s, loss=0.662, v_num=4, train_loss=0.591, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.651, val_accuracy=0.671, val_f1_score=0.671]
Epoch 2:  90%|█████████ | 230/255 [01:29<00:09,  2.58it/s, loss=0.662, v_num=4, train_loss=0.591, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.651, val_accuracy=0.671, val_f1_score=0.671]
Epoch 2:  91%|█████████ | 232/255 [01:29<00:08,  2.60it/s, loss=0.662, v_num=4, train_loss=0.591, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.651, val_accuracy=0.671, val_f1_score=0.671]
Epoch 2:  92%|█████████▏| 234/255 [01:29<00:08,  2.62it/s, loss=0.662, v_num=4, train_loss=0.591, train_accuracy=0.667, 

Epoch 2, global step 677: val_loss reached 0.58367 (best 0.58367), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v3.ckpt" as top 2


Epoch 3:  89%|████████▊ | 226/255 [01:20<00:10,  2.80it/s, loss=0.475, v_num=4, train_loss=0.443, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.584, val_accuracy=0.688, val_f1_score=0.688]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 3:  89%|████████▉ | 228/255 [01:28<00:10,  2.59it/s, loss=0.475, v_num=4, train_loss=0.443, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.584, val_accuracy=0.688, val_f1_score=0.688]
Epoch 3:  90%|█████████ | 230/255 [01:28<00:09,  2.61it/s, loss=0.475, v_num=4, train_loss=0.443, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.584, val_accuracy=0.688, val_f1_score=0.688]
Epoch 3:  91%|█████████ | 232/255 [01:28<00:08,  2.63it/s, loss=0.475, v_num=4, train_loss=0.443, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.584, val_accuracy=0.688, val_f1_score=0.688]
Epoch 3:  92%|█████████▏| 234/255 [01:28<00:07,  2.64it/s, loss=0.475, v_num=4, train_loss=0.443, train_accuracy=0.722, 

Epoch 3, global step 903: val_loss reached 0.49782 (best 0.49782), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v2.ckpt" as top 2


Epoch 4:  89%|████████▊ | 226/255 [01:26<00:11,  2.62it/s, loss=0.642, v_num=4, train_loss=0.663, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.498, val_accuracy=0.789, val_f1_score=0.789]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 4:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.642, v_num=4, train_loss=0.663, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.498, val_accuracy=0.789, val_f1_score=0.789]
Epoch 4:  90%|█████████ | 230/255 [01:34<00:10,  2.44it/s, loss=0.642, v_num=4, train_loss=0.663, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.498, val_accuracy=0.789, val_f1_score=0.789]
Epoch 4:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.642, v_num=4, train_loss=0.663, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.498, val_accuracy=0.789, val_f1_score=0.789]
Epoch 4:  92%|█████████▏| 234/255 [01:34<00:08,  2.47it/s, loss=0.642, v_num=4, train_loss=0.663, train_accuracy=0.722, 

Epoch 4, global step 1129: val_loss was not in top 2


Epoch 5:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.489, v_num=4, train_loss=0.482, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.693, val_accuracy=0.686, val_f1_score=0.686]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 5:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.489, v_num=4, train_loss=0.482, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.693, val_accuracy=0.686, val_f1_score=0.686]
Validating:   7%|▋         | 2/29 [00:07<01:22,  3.07s/it][A
Epoch 5:  90%|█████████ | 230/255 [01:34<00:10,  2.44it/s, loss=0.489, v_num=4, train_loss=0.482, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.693, val_accuracy=0.686, val_f1_score=0.686]
Epoch 5:  91%|█████████ | 232/255 [01:34<00:09,  2.46it/s, loss=0.489, v_num=4, train_loss=0.482, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.693, val_accuracy=0.686, val_f1_score=0.686]
Epoch 5:  92%|█████████▏| 234/255 [01:34<00:08,  2.47it/s,

Epoch 5, global step 1355: val_loss reached 0.51844 (best 0.49782), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v3.ckpt" as top 2


Epoch 6:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.395, v_num=4, train_loss=0.179, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.518, val_accuracy=0.751, val_f1_score=0.751]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 6:  89%|████████▉ | 228/255 [01:33<00:11,  2.43it/s, loss=0.395, v_num=4, train_loss=0.179, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.518, val_accuracy=0.751, val_f1_score=0.751]
Epoch 6:  90%|█████████ | 230/255 [01:34<00:10,  2.45it/s, loss=0.395, v_num=4, train_loss=0.179, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.518, val_accuracy=0.751, val_f1_score=0.751]
Epoch 6:  91%|█████████ | 232/255 [01:34<00:09,  2.46it/s, loss=0.395, v_num=4, train_loss=0.179, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.518, val_accuracy=0.751, val_f1_score=0.751]
Epoch 6:  92%|█████████▏| 234/255 [01:34<00:08,  2.48it/s, loss=0.395, v_num=4, train_loss=0.179, train_accuracy=0.944, 

Epoch 6, global step 1581: val_loss reached 0.44842 (best 0.44842), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v3.ckpt" as top 2


Epoch 7:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.404, v_num=4, train_loss=0.250, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.448, val_accuracy=0.813, val_f1_score=0.813]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 7:  89%|████████▉ | 228/255 [01:34<00:11,  2.43it/s, loss=0.404, v_num=4, train_loss=0.250, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.448, val_accuracy=0.813, val_f1_score=0.813]
Epoch 7:  90%|█████████ | 230/255 [01:34<00:10,  2.44it/s, loss=0.404, v_num=4, train_loss=0.250, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.448, val_accuracy=0.813, val_f1_score=0.813]
Epoch 7:  91%|█████████ | 232/255 [01:34<00:09,  2.46it/s, loss=0.404, v_num=4, train_loss=0.250, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.448, val_accuracy=0.813, val_f1_score=0.813]
Epoch 7:  92%|█████████▏| 234/255 [01:34<00:08,  2.48it/s, loss=0.404, v_num=4, train_loss=0.250, train_accuracy=0.944, 

Epoch 7, global step 1807: val_loss was not in top 2


Epoch 8:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.322, v_num=4, train_loss=0.267, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.524, val_accuracy=0.778, val_f1_score=0.778]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 8:  89%|████████▉ | 228/255 [01:33<00:11,  2.43it/s, loss=0.322, v_num=4, train_loss=0.267, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.524, val_accuracy=0.778, val_f1_score=0.778]
Epoch 8:  90%|█████████ | 230/255 [01:34<00:10,  2.45it/s, loss=0.322, v_num=4, train_loss=0.267, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.524, val_accuracy=0.778, val_f1_score=0.778]
Epoch 8:  91%|█████████ | 232/255 [01:34<00:09,  2.46it/s, loss=0.322, v_num=4, train_loss=0.267, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.524, val_accuracy=0.778, val_f1_score=0.778]
Epoch 8:  92%|█████████▏| 234/255 [01:34<00:08,  2.48it/s, loss=0.322, v_num=4, train_loss=0.267, train_accuracy=0.889, 

Epoch 8, global step 2033: val_loss was not in top 2


Epoch 9:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.361, v_num=4, train_loss=0.434, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.503, val_accuracy=0.785, val_f1_score=0.785]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 9:  89%|████████▉ | 228/255 [01:34<00:11,  2.43it/s, loss=0.361, v_num=4, train_loss=0.434, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.503, val_accuracy=0.785, val_f1_score=0.785]
Epoch 9:  90%|█████████ | 230/255 [01:34<00:10,  2.44it/s, loss=0.361, v_num=4, train_loss=0.434, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.503, val_accuracy=0.785, val_f1_score=0.785]
Epoch 9:  91%|█████████ | 232/255 [01:34<00:09,  2.46it/s, loss=0.361, v_num=4, train_loss=0.434, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.503, val_accuracy=0.785, val_f1_score=0.785]
Epoch 9:  92%|█████████▏| 234/255 [01:34<00:08,  2.48it/s, loss=0.361, v_num=4, train_loss=0.434, train_accuracy=0.722, 

Epoch 9, global step 2259: val_loss reached 0.44052 (best 0.44052), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v2.ckpt" as top 2


Epoch 10:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.302, v_num=4, train_loss=0.398, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.441, val_accuracy=0.818, val_f1_score=0.818] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 10:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.302, v_num=4, train_loss=0.398, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.441, val_accuracy=0.818, val_f1_score=0.818]
Epoch 10:  90%|█████████ | 230/255 [01:34<00:10,  2.44it/s, loss=0.302, v_num=4, train_loss=0.398, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.441, val_accuracy=0.818, val_f1_score=0.818]
Epoch 10:  91%|█████████ | 232/255 [01:34<00:09,  2.46it/s, loss=0.302, v_num=4, train_loss=0.398, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.441, val_accuracy=0.818, val_f1_score=0.818]
Epoch 10:  92%|█████████▏| 234/255 [01:34<00:08,  2.47it/s, loss=0.302, v_num=4, train_loss=0.398, train_accuracy=0

Epoch 10, global step 2485: val_loss was not in top 2


Epoch 11:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.288, v_num=4, train_loss=0.217, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.497, val_accuracy=0.820, val_f1_score=0.820]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 11:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.288, v_num=4, train_loss=0.217, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.497, val_accuracy=0.820, val_f1_score=0.820]
Epoch 11:  90%|█████████ | 230/255 [01:34<00:10,  2.44it/s, loss=0.288, v_num=4, train_loss=0.217, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.497, val_accuracy=0.820, val_f1_score=0.820]
Epoch 11:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.288, v_num=4, train_loss=0.217, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.497, val_accuracy=0.820, val_f1_score=0.820]
Epoch 11:  92%|█████████▏| 234/255 [01:34<00:08,  2.47it/s, loss=0.288, v_num=4, train_loss=0.217, train_accuracy=0.

Epoch 11, global step 2711: val_loss was not in top 2


Epoch 12:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.301, v_num=4, train_loss=0.192, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.534, val_accuracy=0.799, val_f1_score=0.799]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 12:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.301, v_num=4, train_loss=0.192, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.534, val_accuracy=0.799, val_f1_score=0.799]
Epoch 12:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.301, v_num=4, train_loss=0.192, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.534, val_accuracy=0.799, val_f1_score=0.799]
Epoch 12:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.301, v_num=4, train_loss=0.192, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.534, val_accuracy=0.799, val_f1_score=0.799]
Epoch 12:  92%|█████████▏| 234/255 [01:34<00:08,  2.47it/s, loss=0.301, v_num=4, train_loss=0.192, train_accuracy=0.

Epoch 12, global step 2937: val_loss reached 0.44535 (best 0.44052), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v3.ckpt" as top 2


Epoch 13:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.266, v_num=4, train_loss=0.369, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.445, val_accuracy=0.835, val_f1_score=0.835] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 13:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.266, v_num=4, train_loss=0.369, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.445, val_accuracy=0.835, val_f1_score=0.835]
Epoch 13:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.266, v_num=4, train_loss=0.369, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.445, val_accuracy=0.835, val_f1_score=0.835]
Epoch 13:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.266, v_num=4, train_loss=0.369, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.445, val_accuracy=0.835, val_f1_score=0.835]
Epoch 13:  92%|█████████▏| 234/255 [01:34<00:08,  2.46it/s, loss=0.266, v_num=4, train_loss=0.369, train_accuracy=0

Epoch 13, global step 3163: val_loss was not in top 2


Epoch 14:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.331, v_num=4, train_loss=0.262, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.467, val_accuracy=0.840, val_f1_score=0.840]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 14:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.331, v_num=4, train_loss=0.262, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.467, val_accuracy=0.840, val_f1_score=0.840]
Epoch 14:  90%|█████████ | 230/255 [01:34<00:10,  2.42it/s, loss=0.331, v_num=4, train_loss=0.262, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.467, val_accuracy=0.840, val_f1_score=0.840]
Epoch 14:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.331, v_num=4, train_loss=0.262, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.467, val_accuracy=0.840, val_f1_score=0.840]
Epoch 14:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.331, v_num=4, train_loss=0.262, train_accuracy=0.

Epoch 14, global step 3389: val_loss was not in top 2


Epoch 15:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.284, v_num=4, train_loss=0.330, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.507, val_accuracy=0.789, val_f1_score=0.789]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 15:  89%|████████▉ | 228/255 [01:34<00:11,  2.40it/s, loss=0.284, v_num=4, train_loss=0.330, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.507, val_accuracy=0.789, val_f1_score=0.789]
Epoch 15:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.284, v_num=4, train_loss=0.330, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.507, val_accuracy=0.789, val_f1_score=0.789]
Epoch 15:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.284, v_num=4, train_loss=0.330, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.507, val_accuracy=0.789, val_f1_score=0.789]
Epoch 15:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.284, v_num=4, train_loss=0.330, train_accuracy=0.

Epoch 15, global step 3615: val_loss was not in top 2


Epoch 16:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.397, v_num=4, train_loss=0.285, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.482, val_accuracy=0.818, val_f1_score=0.818]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 16:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.397, v_num=4, train_loss=0.285, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.482, val_accuracy=0.818, val_f1_score=0.818]
Epoch 16:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.397, v_num=4, train_loss=0.285, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.482, val_accuracy=0.818, val_f1_score=0.818]
Epoch 16:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.397, v_num=4, train_loss=0.285, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.482, val_accuracy=0.818, val_f1_score=0.818]
Epoch 16:  92%|█████████▏| 234/255 [01:34<00:08,  2.46it/s, loss=0.397, v_num=4, train_loss=0.285, train_accuracy=0.

Epoch 16, global step 3841: val_loss was not in top 2


Epoch 17:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.343, v_num=4, train_loss=0.365, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.570, val_accuracy=0.795, val_f1_score=0.795]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 17:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.343, v_num=4, train_loss=0.365, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.570, val_accuracy=0.795, val_f1_score=0.795]
Epoch 17:  90%|█████████ | 230/255 [01:34<00:10,  2.44it/s, loss=0.343, v_num=4, train_loss=0.365, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.570, val_accuracy=0.795, val_f1_score=0.795]
Epoch 17:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.343, v_num=4, train_loss=0.365, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.570, val_accuracy=0.795, val_f1_score=0.795]
Epoch 17:  92%|█████████▏| 234/255 [01:34<00:08,  2.47it/s, loss=0.343, v_num=4, train_loss=0.365, train_accuracy=0.

Epoch 17, global step 4067: val_loss was not in top 2


Epoch 18:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.273, v_num=4, train_loss=0.155, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.553, val_accuracy=0.790, val_f1_score=0.790]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 18:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.273, v_num=4, train_loss=0.155, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.553, val_accuracy=0.790, val_f1_score=0.790]
Validating:   7%|▋         | 2/29 [00:07<01:26,  3.20s/it][A
Epoch 18:  90%|█████████ | 230/255 [01:34<00:10,  2.42it/s, loss=0.273, v_num=4, train_loss=0.155, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.553, val_accuracy=0.790, val_f1_score=0.790]
Epoch 18:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.273, v_num=4, train_loss=0.155, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.553, val_accuracy=0.790, val_f1_score=0.790]
Epoch 18:  92%|█████████▏| 234/255 [01:35<00:08,  2.45

Epoch 18, global step 4293: val_loss was not in top 2


Epoch 19:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.234, v_num=4, train_loss=0.256, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.459, val_accuracy=0.808, val_f1_score=0.808] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 19:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.234, v_num=4, train_loss=0.256, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.459, val_accuracy=0.808, val_f1_score=0.808]
Epoch 19:  90%|█████████ | 230/255 [01:34<00:10,  2.44it/s, loss=0.234, v_num=4, train_loss=0.256, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.459, val_accuracy=0.808, val_f1_score=0.808]
Epoch 19:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.234, v_num=4, train_loss=0.256, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.459, val_accuracy=0.808, val_f1_score=0.808]
Epoch 19:  92%|█████████▏| 234/255 [01:34<00:08,  2.47it/s, loss=0.234, v_num=4, train_loss=0.256, train_accuracy=0

Epoch 19, global step 4519: val_loss reached 0.42238 (best 0.42238), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v3.ckpt" as top 2


Epoch 20:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.211, v_num=4, train_loss=0.250, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.422, val_accuracy=0.847, val_f1_score=0.847] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 20:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.211, v_num=4, train_loss=0.250, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.422, val_accuracy=0.847, val_f1_score=0.847]
Validating:   7%|▋         | 2/29 [00:07<01:26,  3.22s/it][A
Epoch 20:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.211, v_num=4, train_loss=0.250, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.422, val_accuracy=0.847, val_f1_score=0.847]
Epoch 20:  91%|█████████ | 232/255 [01:34<00:09,  2.44it/s, loss=0.211, v_num=4, train_loss=0.250, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.422, val_accuracy=0.847, val_f1_score=0.847]
Epoch 20:  92%|█████████▏| 234/255 [01:35<00:08,  2.4

Epoch 20, global step 4745: val_loss was not in top 2


Epoch 21:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.325, v_num=4, train_loss=0.290, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.612, val_accuracy=0.811, val_f1_score=0.811]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 21:  89%|████████▉ | 228/255 [01:34<00:11,  2.40it/s, loss=0.325, v_num=4, train_loss=0.290, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.612, val_accuracy=0.811, val_f1_score=0.811]
Epoch 21:  90%|█████████ | 230/255 [01:34<00:10,  2.42it/s, loss=0.325, v_num=4, train_loss=0.290, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.612, val_accuracy=0.811, val_f1_score=0.811]
Epoch 21:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.325, v_num=4, train_loss=0.290, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.612, val_accuracy=0.811, val_f1_score=0.811]
Epoch 21:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.325, v_num=4, train_loss=0.290, train_accuracy=0.

Epoch 21, global step 4971: val_loss was not in top 2


Epoch 22:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.271, v_num=4, train_loss=0.246, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.642, val_accuracy=0.798, val_f1_score=0.798]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 22:  89%|████████▉ | 228/255 [01:34<00:11,  2.40it/s, loss=0.271, v_num=4, train_loss=0.246, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.642, val_accuracy=0.798, val_f1_score=0.798]
Validating:   7%|▋         | 2/29 [00:07<01:26,  3.22s/it][A
Epoch 22:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.271, v_num=4, train_loss=0.246, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.642, val_accuracy=0.798, val_f1_score=0.798]
Epoch 22:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.271, v_num=4, train_loss=0.246, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.642, val_accuracy=0.798, val_f1_score=0.798]
Epoch 22:  92%|█████████▏| 234/255 [01:35<00:08,  2.45

Epoch 22, global step 5197: val_loss reached 0.43581 (best 0.42238), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v2.ckpt" as top 2


Epoch 23:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.386, v_num=4, train_loss=0.133, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.436, val_accuracy=0.830, val_f1_score=0.830] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 23:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.386, v_num=4, train_loss=0.133, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.436, val_accuracy=0.830, val_f1_score=0.830]
Epoch 23:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.386, v_num=4, train_loss=0.133, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.436, val_accuracy=0.830, val_f1_score=0.830]
Epoch 23:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.386, v_num=4, train_loss=0.133, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.436, val_accuracy=0.830, val_f1_score=0.830]
Epoch 23:  92%|█████████▏| 234/255 [01:34<00:08,  2.46it/s, loss=0.386, v_num=4, train_loss=0.133, train_accuracy=0

Epoch 23, global step 5423: val_loss was not in top 2


Epoch 24:  89%|████████▊ | 226/255 [01:27<00:11,  2.60it/s, loss=0.339, v_num=4, train_loss=0.470, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.491, val_accuracy=0.832, val_f1_score=0.832]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 24:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.339, v_num=4, train_loss=0.470, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.491, val_accuracy=0.832, val_f1_score=0.832]
Epoch 24:  90%|█████████ | 230/255 [01:34<00:10,  2.42it/s, loss=0.339, v_num=4, train_loss=0.470, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.491, val_accuracy=0.832, val_f1_score=0.832]
Epoch 24:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.339, v_num=4, train_loss=0.470, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.491, val_accuracy=0.832, val_f1_score=0.832]
Epoch 24:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.339, v_num=4, train_loss=0.470, train_accuracy=0.

Epoch 24, global step 5649: val_loss was not in top 2


Epoch 25:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.269, v_num=4, train_loss=0.294, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.482, val_accuracy=0.823, val_f1_score=0.823]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 25:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.269, v_num=4, train_loss=0.294, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.482, val_accuracy=0.823, val_f1_score=0.823]
Epoch 25:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.269, v_num=4, train_loss=0.294, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.482, val_accuracy=0.823, val_f1_score=0.823]
Epoch 25:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.269, v_num=4, train_loss=0.294, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.482, val_accuracy=0.823, val_f1_score=0.823]
Epoch 25:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.269, v_num=4, train_loss=0.294, train_accuracy=0.

Epoch 25, global step 5875: val_loss was not in top 2


Epoch 26:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.238, v_num=4, train_loss=0.157, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.491, val_accuracy=0.817, val_f1_score=0.817]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 26:  89%|████████▉ | 228/255 [01:35<00:11,  2.40it/s, loss=0.238, v_num=4, train_loss=0.157, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.491, val_accuracy=0.817, val_f1_score=0.817]
Epoch 26:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.238, v_num=4, train_loss=0.157, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.491, val_accuracy=0.817, val_f1_score=0.817]
Epoch 26:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.238, v_num=4, train_loss=0.157, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.491, val_accuracy=0.817, val_f1_score=0.817]
Epoch 26:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.238, v_num=4, train_loss=0.157, train_accuracy=1.

Epoch 26, global step 6101: val_loss was not in top 2


Epoch 27:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.236, v_num=4, train_loss=0.337, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.462, val_accuracy=0.816, val_f1_score=0.816] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 27:  89%|████████▉ | 228/255 [01:35<00:11,  2.40it/s, loss=0.236, v_num=4, train_loss=0.337, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.462, val_accuracy=0.816, val_f1_score=0.816]
Epoch 27:  90%|█████████ | 230/255 [01:35<00:10,  2.41it/s, loss=0.236, v_num=4, train_loss=0.337, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.462, val_accuracy=0.816, val_f1_score=0.816]
Epoch 27:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.236, v_num=4, train_loss=0.337, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.462, val_accuracy=0.816, val_f1_score=0.816]
Epoch 27:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.236, v_num=4, train_loss=0.337, train_accuracy=0

Epoch 27, global step 6327: val_loss reached 0.42787 (best 0.42238), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v2.ckpt" as top 2


Epoch 28:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.221, v_num=4, train_loss=0.212, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.428, val_accuracy=0.835, val_f1_score=0.835] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 28:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.221, v_num=4, train_loss=0.212, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.428, val_accuracy=0.835, val_f1_score=0.835]
Epoch 28:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.221, v_num=4, train_loss=0.212, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.428, val_accuracy=0.835, val_f1_score=0.835]
Epoch 28:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.221, v_num=4, train_loss=0.212, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.428, val_accuracy=0.835, val_f1_score=0.835]
Epoch 28:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.221, v_num=4, train_loss=0.212, train_accuracy=0

Epoch 28, global step 6553: val_loss reached 0.39500 (best 0.39500), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v2.ckpt" as top 2


Epoch 29:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.24, v_num=4, train_loss=0.338, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.395, val_accuracy=0.850, val_f1_score=0.850]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 29:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.24, v_num=4, train_loss=0.338, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.395, val_accuracy=0.850, val_f1_score=0.850]
Epoch 29:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.24, v_num=4, train_loss=0.338, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.395, val_accuracy=0.850, val_f1_score=0.850]
Validating:  14%|█▍        | 4/29 [00:07<00:33,  1.36s/it][A
Epoch 29:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.24, v_num=4, train_loss=0.338, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.395, val_accuracy=0.850, val_f1_score=0.850]
Epoch 29:  92%|█████████▏| 234/255 [01:34<00:08,  2.46it

Epoch 29, global step 6779: val_loss reached 0.38835 (best 0.38835), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v3.ckpt" as top 2


Epoch 30:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.248, v_num=4, train_loss=0.385, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.388, val_accuracy=0.865, val_f1_score=0.865] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 30:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.248, v_num=4, train_loss=0.385, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.388, val_accuracy=0.865, val_f1_score=0.865]
Epoch 30:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.248, v_num=4, train_loss=0.385, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.388, val_accuracy=0.865, val_f1_score=0.865]
Epoch 30:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.248, v_num=4, train_loss=0.385, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.388, val_accuracy=0.865, val_f1_score=0.865]
Epoch 30:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.248, v_num=4, train_loss=0.385, train_accuracy=0

Epoch 30, global step 7005: val_loss was not in top 2


Epoch 31:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.195, v_num=4, train_loss=0.158, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.443, val_accuracy=0.859, val_f1_score=0.859] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 31:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.195, v_num=4, train_loss=0.158, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.443, val_accuracy=0.859, val_f1_score=0.859]
Epoch 31:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.195, v_num=4, train_loss=0.158, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.443, val_accuracy=0.859, val_f1_score=0.859]
Epoch 31:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.195, v_num=4, train_loss=0.158, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.443, val_accuracy=0.859, val_f1_score=0.859]
Epoch 31:  92%|█████████▏| 234/255 [01:34<00:08,  2.46it/s, loss=0.195, v_num=4, train_loss=0.158, train_accuracy=0

Epoch 31, global step 7231: val_loss reached 0.39346 (best 0.38835), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v2.ckpt" as top 2


Epoch 32:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.189, v_num=4, train_loss=0.216, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.393, val_accuracy=0.869, val_f1_score=0.869] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 32:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.189, v_num=4, train_loss=0.216, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.393, val_accuracy=0.869, val_f1_score=0.869]
Validating:   7%|▋         | 2/29 [00:07<01:25,  3.18s/it][A
Epoch 32:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.189, v_num=4, train_loss=0.216, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.393, val_accuracy=0.869, val_f1_score=0.869]
Epoch 32:  91%|█████████ | 232/255 [01:34<00:09,  2.44it/s, loss=0.189, v_num=4, train_loss=0.216, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.393, val_accuracy=0.869, val_f1_score=0.869]
Epoch 32:  92%|█████████▏| 234/255 [01:35<00:08,  2.4

Epoch 32, global step 7457: val_loss was not in top 2


Epoch 33:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.191, v_num=4, train_loss=0.466, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.431, val_accuracy=0.869, val_f1_score=0.869] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 33:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.191, v_num=4, train_loss=0.466, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.431, val_accuracy=0.869, val_f1_score=0.869]
Epoch 33:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.191, v_num=4, train_loss=0.466, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.431, val_accuracy=0.869, val_f1_score=0.869]
Epoch 33:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.191, v_num=4, train_loss=0.466, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.431, val_accuracy=0.869, val_f1_score=0.869]
Epoch 33:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.191, v_num=4, train_loss=0.466, train_accuracy=0

Epoch 33, global step 7683: val_loss was not in top 2


Epoch 34:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.225, v_num=4, train_loss=0.223, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.408, val_accuracy=0.859, val_f1_score=0.859] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 34:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.225, v_num=4, train_loss=0.223, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.408, val_accuracy=0.859, val_f1_score=0.859]
Epoch 34:  90%|█████████ | 230/255 [01:34<00:10,  2.42it/s, loss=0.225, v_num=4, train_loss=0.223, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.408, val_accuracy=0.859, val_f1_score=0.859]
Epoch 34:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.225, v_num=4, train_loss=0.223, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.408, val_accuracy=0.859, val_f1_score=0.859]
Epoch 34:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.225, v_num=4, train_loss=0.223, train_accuracy=0

Epoch 34, global step 7909: val_loss was not in top 2


Epoch 35:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.366, v_num=4, train_loss=0.580, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.495, val_accuracy=0.842, val_f1_score=0.842] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 35:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.366, v_num=4, train_loss=0.580, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.495, val_accuracy=0.842, val_f1_score=0.842]
Epoch 35:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.366, v_num=4, train_loss=0.580, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.495, val_accuracy=0.842, val_f1_score=0.842]
Epoch 35:  91%|█████████ | 232/255 [01:34<00:09,  2.44it/s, loss=0.366, v_num=4, train_loss=0.580, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.495, val_accuracy=0.842, val_f1_score=0.842]
Epoch 35:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.366, v_num=4, train_loss=0.580, train_accuracy=0

Epoch 35, global step 8135: val_loss was not in top 2


Epoch 36:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.24, v_num=4, train_loss=0.286, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.423, val_accuracy=0.839, val_f1_score=0.839] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 36:  89%|████████▉ | 228/255 [01:35<00:11,  2.40it/s, loss=0.24, v_num=4, train_loss=0.286, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.423, val_accuracy=0.839, val_f1_score=0.839]
Epoch 36:  90%|█████████ | 230/255 [01:35<00:10,  2.41it/s, loss=0.24, v_num=4, train_loss=0.286, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.423, val_accuracy=0.839, val_f1_score=0.839]
Epoch 36:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.24, v_num=4, train_loss=0.286, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.423, val_accuracy=0.839, val_f1_score=0.839]
Epoch 36:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.24, v_num=4, train_loss=0.286, train_accuracy=0.722,

Epoch 36, global step 8361: val_loss reached 0.37534 (best 0.37534), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v2.ckpt" as top 2


Epoch 37:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.192, v_num=4, train_loss=0.184, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.375, val_accuracy=0.853, val_f1_score=0.853] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 37:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.192, v_num=4, train_loss=0.184, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.375, val_accuracy=0.853, val_f1_score=0.853]
Epoch 37:  90%|█████████ | 230/255 [01:34<00:10,  2.42it/s, loss=0.192, v_num=4, train_loss=0.184, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.375, val_accuracy=0.853, val_f1_score=0.853]
Epoch 37:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.192, v_num=4, train_loss=0.184, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.375, val_accuracy=0.853, val_f1_score=0.853]
Epoch 37:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.192, v_num=4, train_loss=0.184, train_accuracy=0

Epoch 37, global step 8587: val_loss reached 0.38540 (best 0.37534), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v3.ckpt" as top 2


Epoch 38:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.195, v_num=4, train_loss=0.344, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.385, val_accuracy=0.869, val_f1_score=0.869] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 38:  89%|████████▉ | 228/255 [01:35<00:11,  2.40it/s, loss=0.195, v_num=4, train_loss=0.344, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.385, val_accuracy=0.869, val_f1_score=0.869]
Epoch 38:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.195, v_num=4, train_loss=0.344, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.385, val_accuracy=0.869, val_f1_score=0.869]
Epoch 38:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.195, v_num=4, train_loss=0.344, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.385, val_accuracy=0.869, val_f1_score=0.869]
Epoch 38:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.195, v_num=4, train_loss=0.344, train_accuracy=0

Epoch 38, global step 8813: val_loss reached 0.35758 (best 0.35758), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v3.ckpt" as top 2


Epoch 39:  89%|████████▊ | 226/255 [01:27<00:11,  2.58it/s, loss=0.263, v_num=4, train_loss=0.223, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.358, val_accuracy=0.859, val_f1_score=0.859]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 39:  89%|████████▉ | 228/255 [01:35<00:11,  2.39it/s, loss=0.263, v_num=4, train_loss=0.223, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.358, val_accuracy=0.859, val_f1_score=0.859]
Epoch 39:  90%|█████████ | 230/255 [01:35<00:10,  2.41it/s, loss=0.263, v_num=4, train_loss=0.223, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.358, val_accuracy=0.859, val_f1_score=0.859]
Epoch 39:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.263, v_num=4, train_loss=0.223, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.358, val_accuracy=0.859, val_f1_score=0.859]
Epoch 39:  92%|█████████▏| 234/255 [01:35<00:08,  2.44it/s, loss=0.263, v_num=4, train_loss=0.223, train_accuracy=0.

Epoch 39, global step 9039: val_loss was not in top 2


Epoch 40:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.236, v_num=4, train_loss=0.341, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.394, val_accuracy=0.859, val_f1_score=0.859] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 40:  89%|████████▉ | 228/255 [01:35<00:11,  2.40it/s, loss=0.236, v_num=4, train_loss=0.341, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.394, val_accuracy=0.859, val_f1_score=0.859]
Epoch 40:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.236, v_num=4, train_loss=0.341, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.394, val_accuracy=0.859, val_f1_score=0.859]
Epoch 40:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.236, v_num=4, train_loss=0.341, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.394, val_accuracy=0.859, val_f1_score=0.859]
Epoch 40:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.236, v_num=4, train_loss=0.341, train_accuracy=0

Epoch 40, global step 9265: val_loss reached 0.36964 (best 0.35758), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v2.ckpt" as top 2


Epoch 41:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.211, v_num=4, train_loss=0.393, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.370, val_accuracy=0.868, val_f1_score=0.868]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 41:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.211, v_num=4, train_loss=0.393, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.370, val_accuracy=0.868, val_f1_score=0.868]
Epoch 41:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.211, v_num=4, train_loss=0.393, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.370, val_accuracy=0.868, val_f1_score=0.868]
Epoch 41:  91%|█████████ | 232/255 [01:34<00:09,  2.44it/s, loss=0.211, v_num=4, train_loss=0.393, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.370, val_accuracy=0.868, val_f1_score=0.868]
Epoch 41:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.211, v_num=4, train_loss=0.393, train_accuracy=0.

Epoch 41, global step 9491: val_loss reached 0.34456 (best 0.34456), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v2.ckpt" as top 2


Epoch 42:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.214, v_num=4, train_loss=0.273, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.345, val_accuracy=0.870, val_f1_score=0.870] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 42:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.214, v_num=4, train_loss=0.273, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.345, val_accuracy=0.870, val_f1_score=0.870]
Epoch 42:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.214, v_num=4, train_loss=0.273, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.345, val_accuracy=0.870, val_f1_score=0.870]
Epoch 42:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.214, v_num=4, train_loss=0.273, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.345, val_accuracy=0.870, val_f1_score=0.870]
Epoch 42:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.214, v_num=4, train_loss=0.273, train_accuracy=0

Epoch 42, global step 9717: val_loss reached 0.33132 (best 0.33132), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v3.ckpt" as top 2


Epoch 43:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.24, v_num=4, train_loss=0.216, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.331, val_accuracy=0.864, val_f1_score=0.864]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 43:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.24, v_num=4, train_loss=0.216, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.331, val_accuracy=0.864, val_f1_score=0.864]
Epoch 43:  90%|█████████ | 230/255 [01:34<00:10,  2.42it/s, loss=0.24, v_num=4, train_loss=0.216, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.331, val_accuracy=0.864, val_f1_score=0.864]
Epoch 43:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.24, v_num=4, train_loss=0.216, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.331, val_accuracy=0.864, val_f1_score=0.864]
Epoch 43:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.24, v_num=4, train_loss=0.216, train_accuracy=0.889

Epoch 43, global step 9943: val_loss was not in top 2


Epoch 44:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.22, v_num=4, train_loss=0.270, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.384, val_accuracy=0.857, val_f1_score=0.857]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 44:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.22, v_num=4, train_loss=0.270, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.384, val_accuracy=0.857, val_f1_score=0.857]
Epoch 44:  90%|█████████ | 230/255 [01:34<00:10,  2.42it/s, loss=0.22, v_num=4, train_loss=0.270, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.384, val_accuracy=0.857, val_f1_score=0.857]
Epoch 44:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.22, v_num=4, train_loss=0.270, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.384, val_accuracy=0.857, val_f1_score=0.857]
Epoch 44:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.22, v_num=4, train_loss=0.270, train_accuracy=0.889

Epoch 44, global step 10169: val_loss was not in top 2


Epoch 45:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.139, v_num=4, train_loss=0.386, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.380, val_accuracy=0.860, val_f1_score=0.860] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 45:  89%|████████▉ | 228/255 [01:34<00:11,  2.40it/s, loss=0.139, v_num=4, train_loss=0.386, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.380, val_accuracy=0.860, val_f1_score=0.860]
Epoch 45:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.139, v_num=4, train_loss=0.386, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.380, val_accuracy=0.860, val_f1_score=0.860]
Epoch 45:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.139, v_num=4, train_loss=0.386, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.380, val_accuracy=0.860, val_f1_score=0.860]
Epoch 45:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.139, v_num=4, train_loss=0.386, train_accuracy=0

Epoch 45, global step 10395: val_loss reached 0.31614 (best 0.31614), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v2.ckpt" as top 2


Epoch 46:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.153, v_num=4, train_loss=0.0783, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.316, val_accuracy=0.887, val_f1_score=0.887]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 46:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.153, v_num=4, train_loss=0.0783, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.316, val_accuracy=0.887, val_f1_score=0.887]
Epoch 46:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.153, v_num=4, train_loss=0.0783, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.316, val_accuracy=0.887, val_f1_score=0.887]
Epoch 46:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.153, v_num=4, train_loss=0.0783, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.316, val_accuracy=0.887, val_f1_score=0.887]
Epoch 46:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.153, v_num=4, train_loss=0.0783, train_accura

Epoch 46, global step 10621: val_loss was not in top 2


Epoch 47:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.194, v_num=4, train_loss=0.0652, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.373, val_accuracy=0.882, val_f1_score=0.882]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 47:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.194, v_num=4, train_loss=0.0652, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.373, val_accuracy=0.882, val_f1_score=0.882]
Epoch 47:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.194, v_num=4, train_loss=0.0652, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.373, val_accuracy=0.882, val_f1_score=0.882]
Epoch 47:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.194, v_num=4, train_loss=0.0652, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.373, val_accuracy=0.882, val_f1_score=0.882]
Epoch 47:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.194, v_num=4, train_loss=0.0652, train_accura

Epoch 47, global step 10847: val_loss was not in top 2


Epoch 48:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.149, v_num=4, train_loss=0.330, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.357, val_accuracy=0.886, val_f1_score=0.886] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 48:  89%|████████▉ | 228/255 [01:34<00:11,  2.40it/s, loss=0.149, v_num=4, train_loss=0.330, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.357, val_accuracy=0.886, val_f1_score=0.886]
Epoch 48:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.149, v_num=4, train_loss=0.330, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.357, val_accuracy=0.886, val_f1_score=0.886]
Validating:  14%|█▍        | 4/29 [00:08<00:34,  1.39s/it][A
Epoch 48:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.149, v_num=4, train_loss=0.330, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.357, val_accuracy=0.886, val_f1_score=0.886]
Epoch 48:  92%|█████████▏| 234/255 [01:35<00:08,  2.4

Epoch 48, global step 11073: val_loss was not in top 2


Epoch 49:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.171, v_num=4, train_loss=0.188, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.379, val_accuracy=0.876, val_f1_score=0.876] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 49:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.171, v_num=4, train_loss=0.188, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.379, val_accuracy=0.876, val_f1_score=0.876]
Epoch 49:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.171, v_num=4, train_loss=0.188, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.379, val_accuracy=0.876, val_f1_score=0.876]
Epoch 49:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.171, v_num=4, train_loss=0.188, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.379, val_accuracy=0.876, val_f1_score=0.876]
Epoch 49:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.171, v_num=4, train_loss=0.188, train_accuracy=0

Epoch 49, global step 11299: val_loss reached 0.32033 (best 0.31614), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v3.ckpt" as top 2


Epoch 50:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.139, v_num=4, train_loss=0.0589, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.320, val_accuracy=0.883, val_f1_score=0.883]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 50:  89%|████████▉ | 228/255 [01:35<00:11,  2.40it/s, loss=0.139, v_num=4, train_loss=0.0589, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.320, val_accuracy=0.883, val_f1_score=0.883]
Epoch 50:  90%|█████████ | 230/255 [01:35<00:10,  2.41it/s, loss=0.139, v_num=4, train_loss=0.0589, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.320, val_accuracy=0.883, val_f1_score=0.883]
Epoch 50:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.139, v_num=4, train_loss=0.0589, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.320, val_accuracy=0.883, val_f1_score=0.883]
Epoch 50:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.139, v_num=4, train_loss=0.0589, train_accura

Epoch 50, global step 11525: val_loss was not in top 2


Epoch 51:  89%|████████▊ | 226/255 [01:27<00:11,  2.57it/s, loss=0.15, v_num=4, train_loss=0.295, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.413, val_accuracy=0.886, val_f1_score=0.886]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 51:  89%|████████▉ | 228/255 [01:35<00:11,  2.38it/s, loss=0.15, v_num=4, train_loss=0.295, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.413, val_accuracy=0.886, val_f1_score=0.886]
Epoch 51:  90%|█████████ | 230/255 [01:36<00:10,  2.40it/s, loss=0.15, v_num=4, train_loss=0.295, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.413, val_accuracy=0.886, val_f1_score=0.886]
Epoch 51:  91%|█████████ | 232/255 [01:36<00:09,  2.41it/s, loss=0.15, v_num=4, train_loss=0.295, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.413, val_accuracy=0.886, val_f1_score=0.886]
Epoch 51:  92%|█████████▏| 234/255 [01:36<00:08,  2.43it/s, loss=0.15, v_num=4, train_loss=0.295, train_accuracy=0.889

Epoch 51, global step 11751: val_loss reached 0.31619 (best 0.31614), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v3.ckpt" as top 2


Epoch 52:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.175, v_num=4, train_loss=0.188, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.316, val_accuracy=0.895, val_f1_score=0.895] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 52:  89%|████████▉ | 228/255 [01:34<00:11,  2.40it/s, loss=0.175, v_num=4, train_loss=0.188, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.316, val_accuracy=0.895, val_f1_score=0.895]
Epoch 52:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.175, v_num=4, train_loss=0.188, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.316, val_accuracy=0.895, val_f1_score=0.895]
Epoch 52:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.175, v_num=4, train_loss=0.188, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.316, val_accuracy=0.895, val_f1_score=0.895]
Epoch 52:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.175, v_num=4, train_loss=0.188, train_accuracy=0

Epoch 52, global step 11977: val_loss reached 0.28995 (best 0.28995), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v3.ckpt" as top 2


Epoch 53:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.128, v_num=4, train_loss=0.130, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.290, val_accuracy=0.889, val_f1_score=0.889] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 53:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.128, v_num=4, train_loss=0.130, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.290, val_accuracy=0.889, val_f1_score=0.889]
Epoch 53:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.128, v_num=4, train_loss=0.130, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.290, val_accuracy=0.889, val_f1_score=0.889]
Epoch 53:  91%|█████████ | 232/255 [01:34<00:09,  2.44it/s, loss=0.128, v_num=4, train_loss=0.130, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.290, val_accuracy=0.889, val_f1_score=0.889]
Epoch 53:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.128, v_num=4, train_loss=0.130, train_accuracy=0

Epoch 53, global step 12203: val_loss reached 0.28728 (best 0.28728), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v2.ckpt" as top 2


Epoch 54:  89%|████████▊ | 226/255 [01:27<00:11,  2.60it/s, loss=0.125, v_num=4, train_loss=0.047, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.287, val_accuracy=0.902, val_f1_score=0.902] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 54:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.125, v_num=4, train_loss=0.047, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.287, val_accuracy=0.902, val_f1_score=0.902]
Validating:   7%|▋         | 2/29 [00:07<01:26,  3.20s/it][A
Epoch 54:  90%|█████████ | 230/255 [01:34<00:10,  2.42it/s, loss=0.125, v_num=4, train_loss=0.047, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.287, val_accuracy=0.902, val_f1_score=0.902]
Epoch 54:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.125, v_num=4, train_loss=0.047, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.287, val_accuracy=0.902, val_f1_score=0.902]
Epoch 54:  92%|█████████▏| 234/255 [01:35<00:08,  2.4

Epoch 54, global step 12429: val_loss was not in top 2


Epoch 55:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.137, v_num=4, train_loss=0.0773, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.345, val_accuracy=0.894, val_f1_score=0.894] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 55:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.137, v_num=4, train_loss=0.0773, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.345, val_accuracy=0.894, val_f1_score=0.894]
Validating:   7%|▋         | 2/29 [00:07<01:26,  3.21s/it][A
Epoch 55:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.137, v_num=4, train_loss=0.0773, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.345, val_accuracy=0.894, val_f1_score=0.894]
Epoch 55:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.137, v_num=4, train_loss=0.0773, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.345, val_accuracy=0.894, val_f1_score=0.894]
Epoch 55:  92%|█████████▏| 234/255 [01:35<00:08, 

Epoch 55, global step 12655: val_loss reached 0.28275 (best 0.28275), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v3.ckpt" as top 2


Epoch 56:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.16, v_num=4, train_loss=0.152, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.283, val_accuracy=0.898, val_f1_score=0.898]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 56:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.16, v_num=4, train_loss=0.152, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.283, val_accuracy=0.898, val_f1_score=0.898]
Epoch 56:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.16, v_num=4, train_loss=0.152, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.283, val_accuracy=0.898, val_f1_score=0.898]
Epoch 56:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.16, v_num=4, train_loss=0.152, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.283, val_accuracy=0.898, val_f1_score=0.898]
Epoch 56:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.16, v_num=4, train_loss=0.152, train_accuracy=0.94

Epoch 56, global step 12881: val_loss was not in top 2


Epoch 57:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.128, v_num=4, train_loss=0.0418, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.309, val_accuracy=0.899, val_f1_score=0.899] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 57:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.128, v_num=4, train_loss=0.0418, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.309, val_accuracy=0.899, val_f1_score=0.899]
Epoch 57:  90%|█████████ | 230/255 [01:34<00:10,  2.42it/s, loss=0.128, v_num=4, train_loss=0.0418, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.309, val_accuracy=0.899, val_f1_score=0.899]
Epoch 57:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.128, v_num=4, train_loss=0.0418, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.309, val_accuracy=0.899, val_f1_score=0.899]
Epoch 57:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.128, v_num=4, train_loss=0.0418, train_accur

Epoch 57, global step 13107: val_loss was not in top 2


Epoch 58:  89%|████████▊ | 226/255 [01:27<00:11,  2.60it/s, loss=0.132, v_num=4, train_loss=0.0451, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.896, val_f1_score=0.896]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 58:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.132, v_num=4, train_loss=0.0451, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.896, val_f1_score=0.896]
Epoch 58:  90%|█████████ | 230/255 [01:34<00:10,  2.42it/s, loss=0.132, v_num=4, train_loss=0.0451, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.896, val_f1_score=0.896]
Epoch 58:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.132, v_num=4, train_loss=0.0451, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.896, val_f1_score=0.896]
Epoch 58:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.132, v_num=4, train_loss=0.0451, train_accura

Epoch 58, global step 13333: val_loss was not in top 2


Epoch 59:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.115, v_num=4, train_loss=0.0458, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.326, val_accuracy=0.894, val_f1_score=0.894] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 59:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.115, v_num=4, train_loss=0.0458, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.326, val_accuracy=0.894, val_f1_score=0.894]
Epoch 59:  90%|█████████ | 230/255 [01:34<00:10,  2.42it/s, loss=0.115, v_num=4, train_loss=0.0458, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.326, val_accuracy=0.894, val_f1_score=0.894]
Epoch 59:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.115, v_num=4, train_loss=0.0458, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.326, val_accuracy=0.894, val_f1_score=0.894]
Epoch 59:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.115, v_num=4, train_loss=0.0458, train_accur

Epoch 59, global step 13559: val_loss was not in top 2


Epoch 60:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.0931, v_num=4, train_loss=0.144, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.325, val_accuracy=0.894, val_f1_score=0.894] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 60:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0931, v_num=4, train_loss=0.144, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.325, val_accuracy=0.894, val_f1_score=0.894]
Epoch 60:  90%|█████████ | 230/255 [01:34<00:10,  2.42it/s, loss=0.0931, v_num=4, train_loss=0.144, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.325, val_accuracy=0.894, val_f1_score=0.894]
Epoch 60:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.0931, v_num=4, train_loss=0.144, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.325, val_accuracy=0.894, val_f1_score=0.894]
Epoch 60:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.0931, v_num=4, train_loss=0.144, train_accur

Epoch 60, global step 13785: val_loss was not in top 2


Epoch 61:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.105, v_num=4, train_loss=0.0307, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.316, val_accuracy=0.903, val_f1_score=0.903] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 61:  89%|████████▉ | 228/255 [01:34<00:11,  2.40it/s, loss=0.105, v_num=4, train_loss=0.0307, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.316, val_accuracy=0.903, val_f1_score=0.903]
Epoch 61:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.105, v_num=4, train_loss=0.0307, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.316, val_accuracy=0.903, val_f1_score=0.903]
Epoch 61:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.105, v_num=4, train_loss=0.0307, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.316, val_accuracy=0.903, val_f1_score=0.903]
Epoch 61:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.105, v_num=4, train_loss=0.0307, train_accur

Epoch 61, global step 14011: val_loss was not in top 2


Epoch 62:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.0977, v_num=4, train_loss=0.0617, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.340, val_accuracy=0.902, val_f1_score=0.902]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 62:  89%|████████▉ | 228/255 [01:35<00:11,  2.39it/s, loss=0.0977, v_num=4, train_loss=0.0617, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.340, val_accuracy=0.902, val_f1_score=0.902]
Epoch 62:  90%|█████████ | 230/255 [01:35<00:10,  2.41it/s, loss=0.0977, v_num=4, train_loss=0.0617, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.340, val_accuracy=0.902, val_f1_score=0.902]
Epoch 62:  91%|█████████ | 232/255 [01:35<00:09,  2.42it/s, loss=0.0977, v_num=4, train_loss=0.0617, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.340, val_accuracy=0.902, val_f1_score=0.902]
Epoch 62:  92%|█████████▏| 234/255 [01:35<00:08,  2.44it/s, loss=0.0977, v_num=4, train_loss=0.0617, train_a

Epoch 62, global step 14237: val_loss was not in top 2


Epoch 63:  89%|████████▊ | 226/255 [01:27<00:11,  2.58it/s, loss=0.15, v_num=4, train_loss=0.227, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.348, val_accuracy=0.891, val_f1_score=0.891]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 63:  89%|████████▉ | 228/255 [01:35<00:11,  2.38it/s, loss=0.15, v_num=4, train_loss=0.227, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.348, val_accuracy=0.891, val_f1_score=0.891]
Epoch 63:  90%|█████████ | 230/255 [01:35<00:10,  2.40it/s, loss=0.15, v_num=4, train_loss=0.227, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.348, val_accuracy=0.891, val_f1_score=0.891]
Epoch 63:  91%|█████████ | 232/255 [01:36<00:09,  2.41it/s, loss=0.15, v_num=4, train_loss=0.227, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.348, val_accuracy=0.891, val_f1_score=0.891]
Epoch 63:  92%|█████████▏| 234/255 [01:36<00:08,  2.43it/s, loss=0.15, v_num=4, train_loss=0.227, train_accuracy=0.94

Epoch 63, global step 14463: val_loss was not in top 2


Epoch 64:  89%|████████▊ | 226/255 [01:27<00:11,  2.58it/s, loss=0.0893, v_num=4, train_loss=0.0662, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.350, val_accuracy=0.897, val_f1_score=0.897]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 64:  89%|████████▉ | 228/255 [01:35<00:11,  2.39it/s, loss=0.0893, v_num=4, train_loss=0.0662, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.350, val_accuracy=0.897, val_f1_score=0.897]
Epoch 64:  90%|█████████ | 230/255 [01:35<00:10,  2.40it/s, loss=0.0893, v_num=4, train_loss=0.0662, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.350, val_accuracy=0.897, val_f1_score=0.897]
Epoch 64:  91%|█████████ | 232/255 [01:35<00:09,  2.42it/s, loss=0.0893, v_num=4, train_loss=0.0662, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.350, val_accuracy=0.897, val_f1_score=0.897]
Epoch 64:  92%|█████████▏| 234/255 [01:35<00:08,  2.44it/s, loss=0.0893, v_num=4, train_loss=0.0662, train_a

Epoch 64, global step 14689: val_loss was not in top 2


Epoch 65:  89%|████████▊ | 226/255 [01:27<00:11,  2.60it/s, loss=0.123, v_num=4, train_loss=0.0245, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.317, val_accuracy=0.905, val_f1_score=0.905] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 65:  89%|████████▉ | 228/255 [01:34<00:11,  2.40it/s, loss=0.123, v_num=4, train_loss=0.0245, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.317, val_accuracy=0.905, val_f1_score=0.905]
Epoch 65:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.123, v_num=4, train_loss=0.0245, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.317, val_accuracy=0.905, val_f1_score=0.905]
Epoch 65:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.123, v_num=4, train_loss=0.0245, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.317, val_accuracy=0.905, val_f1_score=0.905]
Epoch 65:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.123, v_num=4, train_loss=0.0245, train_accur

Epoch 65, global step 14915: val_loss was not in top 2


Epoch 66:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.114, v_num=4, train_loss=0.372, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.304, val_accuracy=0.901, val_f1_score=0.901]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 66:  89%|████████▉ | 228/255 [01:34<00:11,  2.40it/s, loss=0.114, v_num=4, train_loss=0.372, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.304, val_accuracy=0.901, val_f1_score=0.901]
Epoch 66:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.114, v_num=4, train_loss=0.372, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.304, val_accuracy=0.901, val_f1_score=0.901]
Epoch 66:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.114, v_num=4, train_loss=0.372, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.304, val_accuracy=0.901, val_f1_score=0.901]
Epoch 66:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.114, v_num=4, train_loss=0.372, train_accuracy=

Epoch 66, global step 15141: val_loss was not in top 2


Epoch 67:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.116, v_num=4, train_loss=0.257, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.320, val_accuracy=0.904, val_f1_score=0.904]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 67:  89%|████████▉ | 228/255 [01:34<00:11,  2.40it/s, loss=0.116, v_num=4, train_loss=0.257, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.320, val_accuracy=0.904, val_f1_score=0.904]
Epoch 67:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.116, v_num=4, train_loss=0.257, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.320, val_accuracy=0.904, val_f1_score=0.904]
Epoch 67:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.116, v_num=4, train_loss=0.257, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.320, val_accuracy=0.904, val_f1_score=0.904]
Epoch 67:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.116, v_num=4, train_loss=0.257, train_accuracy=

Epoch 67, global step 15367: val_loss was not in top 2


Epoch 68:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.141, v_num=4, train_loss=0.0363, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.325, val_accuracy=0.903, val_f1_score=0.903]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 68:  89%|████████▉ | 228/255 [01:34<00:11,  2.40it/s, loss=0.141, v_num=4, train_loss=0.0363, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.325, val_accuracy=0.903, val_f1_score=0.903]
Epoch 68:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.141, v_num=4, train_loss=0.0363, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.325, val_accuracy=0.903, val_f1_score=0.903]
Validating:  14%|█▍        | 4/29 [00:08<00:31,  1.27s/it][A
Epoch 68:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.141, v_num=4, train_loss=0.0363, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.325, val_accuracy=0.903, val_f1_score=0.903]
Epoch 68:  92%|█████████▏| 234/255 [01:35<00:08,  

Epoch 68, global step 15593: val_loss was not in top 2


Epoch 69:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.0927, v_num=4, train_loss=0.0407, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.321, val_accuracy=0.895, val_f1_score=0.895]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 69:  89%|████████▉ | 228/255 [01:34<00:11,  2.40it/s, loss=0.0927, v_num=4, train_loss=0.0407, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.321, val_accuracy=0.895, val_f1_score=0.895]
Epoch 69:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.0927, v_num=4, train_loss=0.0407, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.321, val_accuracy=0.895, val_f1_score=0.895]
Epoch 69:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.0927, v_num=4, train_loss=0.0407, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.321, val_accuracy=0.895, val_f1_score=0.895]
Epoch 69:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.0927, v_num=4, train_loss=0.0407, train_a

Epoch 69, global step 15819: val_loss was not in top 2


Epoch 70:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.0835, v_num=4, train_loss=0.0693, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.342, val_accuracy=0.895, val_f1_score=0.895] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 70:  89%|████████▉ | 228/255 [01:34<00:11,  2.40it/s, loss=0.0835, v_num=4, train_loss=0.0693, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.342, val_accuracy=0.895, val_f1_score=0.895]
Epoch 70:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.0835, v_num=4, train_loss=0.0693, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.342, val_accuracy=0.895, val_f1_score=0.895]
Epoch 70:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.0835, v_num=4, train_loss=0.0693, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.342, val_accuracy=0.895, val_f1_score=0.895]
Epoch 70:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.0835, v_num=4, train_loss=0.0693, train_

Epoch 70, global step 16045: val_loss was not in top 2


Epoch 71:  89%|████████▊ | 226/255 [01:27<00:11,  2.60it/s, loss=0.0721, v_num=4, train_loss=0.0256, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.331, val_accuracy=0.908, val_f1_score=0.908] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 71:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0721, v_num=4, train_loss=0.0256, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.331, val_accuracy=0.908, val_f1_score=0.908]
Validating:   7%|▋         | 2/29 [00:07<01:27,  3.24s/it][A
Epoch 71:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.0721, v_num=4, train_loss=0.0256, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.331, val_accuracy=0.908, val_f1_score=0.908]
Epoch 71:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.0721, v_num=4, train_loss=0.0256, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.331, val_accuracy=0.908, val_f1_score=0.908]
Epoch 71:  92%|█████████▏| 234/255 [01:35<00:

Epoch 71, global step 16271: val_loss was not in top 2


Epoch 72:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.0971, v_num=4, train_loss=0.193, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.314, val_accuracy=0.896, val_f1_score=0.896]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 72:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0971, v_num=4, train_loss=0.193, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.314, val_accuracy=0.896, val_f1_score=0.896]
Validating:   7%|▋         | 2/29 [00:07<01:27,  3.24s/it][A
Epoch 72:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0971, v_num=4, train_loss=0.193, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.314, val_accuracy=0.896, val_f1_score=0.896]
Epoch 72:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.0971, v_num=4, train_loss=0.193, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.314, val_accuracy=0.896, val_f1_score=0.896]
Epoch 72:  92%|█████████▏| 234/255 [01:35<00:08,

Epoch 72, global step 16497: val_loss reached 0.26931 (best 0.26931), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v2.ckpt" as top 2


Epoch 73:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.0935, v_num=4, train_loss=0.0217, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.269, val_accuracy=0.914, val_f1_score=0.914] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 73:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0935, v_num=4, train_loss=0.0217, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.269, val_accuracy=0.914, val_f1_score=0.914]
Epoch 73:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0935, v_num=4, train_loss=0.0217, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.269, val_accuracy=0.914, val_f1_score=0.914]
Validating:  14%|█▍        | 4/29 [00:07<00:31,  1.25s/it][A
Epoch 73:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.0935, v_num=4, train_loss=0.0217, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.269, val_accuracy=0.914, val_f1_score=0.914]
Epoch 73:  92%|█████████▏| 234/255 [01:35<00:

Epoch 73, global step 16723: val_loss was not in top 2


Epoch 74:  89%|████████▊ | 226/255 [01:28<00:11,  2.56it/s, loss=0.0748, v_num=4, train_loss=0.0787, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.344, val_accuracy=0.901, val_f1_score=0.901] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 74:  89%|████████▉ | 228/255 [01:35<00:11,  2.38it/s, loss=0.0748, v_num=4, train_loss=0.0787, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.344, val_accuracy=0.901, val_f1_score=0.901]
Validating:   7%|▋         | 2/29 [00:07<01:26,  3.19s/it][A
Epoch 74:  90%|█████████ | 230/255 [01:36<00:10,  2.39it/s, loss=0.0748, v_num=4, train_loss=0.0787, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.344, val_accuracy=0.901, val_f1_score=0.901]
Epoch 74:  91%|█████████ | 232/255 [01:36<00:09,  2.41it/s, loss=0.0748, v_num=4, train_loss=0.0787, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.344, val_accuracy=0.901, val_f1_score=0.901]
Epoch 74:  92%|█████████▏| 234/255 [01:36<00:

Epoch 74, global step 16949: val_loss was not in top 2


Epoch 75:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.128, v_num=4, train_loss=0.0647, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.356, val_accuracy=0.905, val_f1_score=0.905] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 75:  89%|████████▉ | 228/255 [01:34<00:11,  2.40it/s, loss=0.128, v_num=4, train_loss=0.0647, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.356, val_accuracy=0.905, val_f1_score=0.905]
Epoch 75:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.128, v_num=4, train_loss=0.0647, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.356, val_accuracy=0.905, val_f1_score=0.905]
Epoch 75:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.128, v_num=4, train_loss=0.0647, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.356, val_accuracy=0.905, val_f1_score=0.905]
Epoch 75:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.128, v_num=4, train_loss=0.0647, train_accur

Epoch 75, global step 17175: val_loss was not in top 2


Epoch 76:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.076, v_num=4, train_loss=0.0228, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.321, val_accuracy=0.902, val_f1_score=0.902] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 76:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.076, v_num=4, train_loss=0.0228, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.321, val_accuracy=0.902, val_f1_score=0.902]
Epoch 76:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.076, v_num=4, train_loss=0.0228, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.321, val_accuracy=0.902, val_f1_score=0.902]
Epoch 76:  91%|█████████ | 232/255 [01:34<00:09,  2.44it/s, loss=0.076, v_num=4, train_loss=0.0228, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.321, val_accuracy=0.902, val_f1_score=0.902]
Epoch 76:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.076, v_num=4, train_loss=0.0228, train_accur

Epoch 76, global step 17401: val_loss was not in top 2


Epoch 77:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.0754, v_num=4, train_loss=0.132, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.317, val_accuracy=0.908, val_f1_score=0.908]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 77:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.0754, v_num=4, train_loss=0.132, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.317, val_accuracy=0.908, val_f1_score=0.908]
Epoch 77:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0754, v_num=4, train_loss=0.132, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.317, val_accuracy=0.908, val_f1_score=0.908]
Epoch 77:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.0754, v_num=4, train_loss=0.132, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.317, val_accuracy=0.908, val_f1_score=0.908]
Epoch 77:  92%|█████████▏| 234/255 [01:34<00:08,  2.47it/s, loss=0.0754, v_num=4, train_loss=0.132, train_accu

Epoch 77, global step 17627: val_loss was not in top 2


Epoch 78:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.119, v_num=4, train_loss=0.0585, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.305, val_accuracy=0.914, val_f1_score=0.914] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 78:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.119, v_num=4, train_loss=0.0585, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.305, val_accuracy=0.914, val_f1_score=0.914]
Epoch 78:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.119, v_num=4, train_loss=0.0585, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.305, val_accuracy=0.914, val_f1_score=0.914]
Epoch 78:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.119, v_num=4, train_loss=0.0585, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.305, val_accuracy=0.914, val_f1_score=0.914]
Epoch 78:  92%|█████████▏| 234/255 [01:34<00:08,  2.47it/s, loss=0.119, v_num=4, train_loss=0.0585, train_accur

Epoch 78, global step 17853: val_loss was not in top 2


Epoch 79:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.103, v_num=4, train_loss=0.533, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.312, val_accuracy=0.904, val_f1_score=0.904]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 79:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.103, v_num=4, train_loss=0.533, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.312, val_accuracy=0.904, val_f1_score=0.904]
Epoch 79:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.103, v_num=4, train_loss=0.533, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.312, val_accuracy=0.904, val_f1_score=0.904]
Epoch 79:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.103, v_num=4, train_loss=0.533, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.312, val_accuracy=0.904, val_f1_score=0.904]
Epoch 79:  92%|█████████▏| 234/255 [01:34<00:08,  2.47it/s, loss=0.103, v_num=4, train_loss=0.533, train_accuracy

Epoch 79, global step 18079: val_loss was not in top 2


Epoch 80:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.0856, v_num=4, train_loss=0.191, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.364, val_accuracy=0.907, val_f1_score=0.907]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 80:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.0856, v_num=4, train_loss=0.191, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.364, val_accuracy=0.907, val_f1_score=0.907]
Epoch 80:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0856, v_num=4, train_loss=0.191, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.364, val_accuracy=0.907, val_f1_score=0.907]
Epoch 80:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.0856, v_num=4, train_loss=0.191, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.364, val_accuracy=0.907, val_f1_score=0.907]
Epoch 80:  92%|█████████▏| 234/255 [01:34<00:08,  2.47it/s, loss=0.0856, v_num=4, train_loss=0.191, train_accu

Epoch 80, global step 18305: val_loss was not in top 2


Epoch 81:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.0766, v_num=4, train_loss=0.0444, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.399, val_accuracy=0.908, val_f1_score=0.908]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 81:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0766, v_num=4, train_loss=0.0444, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.399, val_accuracy=0.908, val_f1_score=0.908]
Epoch 81:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0766, v_num=4, train_loss=0.0444, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.399, val_accuracy=0.908, val_f1_score=0.908]
Epoch 81:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.0766, v_num=4, train_loss=0.0444, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.399, val_accuracy=0.908, val_f1_score=0.908]
Epoch 81:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.0766, v_num=4, train_loss=0.0444, train_a

Epoch 81, global step 18531: val_loss was not in top 2


Epoch 82:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.0945, v_num=4, train_loss=0.0384, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.287, val_accuracy=0.911, val_f1_score=0.911] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 82:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0945, v_num=4, train_loss=0.0384, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.287, val_accuracy=0.911, val_f1_score=0.911]
Epoch 82:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0945, v_num=4, train_loss=0.0384, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.287, val_accuracy=0.911, val_f1_score=0.911]
Epoch 82:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.0945, v_num=4, train_loss=0.0384, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.287, val_accuracy=0.911, val_f1_score=0.911]
Epoch 82:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.0945, v_num=4, train_loss=0.0384, train_

Epoch 82, global step 18757: val_loss reached 0.26490 (best 0.26490), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v3.ckpt" as top 2


Epoch 83:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.0936, v_num=4, train_loss=0.0604, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.265, val_accuracy=0.911, val_f1_score=0.911]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 83:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.0936, v_num=4, train_loss=0.0604, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.265, val_accuracy=0.911, val_f1_score=0.911]
Epoch 83:  90%|█████████ | 230/255 [01:34<00:10,  2.44it/s, loss=0.0936, v_num=4, train_loss=0.0604, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.265, val_accuracy=0.911, val_f1_score=0.911]
Epoch 83:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.0936, v_num=4, train_loss=0.0604, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.265, val_accuracy=0.911, val_f1_score=0.911]
Epoch 83:  92%|█████████▏| 234/255 [01:34<00:08,  2.47it/s, loss=0.0936, v_num=4, train_loss=0.0604, train_a

Epoch 83, global step 18983: val_loss was not in top 2


Epoch 84:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.074, v_num=4, train_loss=0.0719, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.273, val_accuracy=0.916, val_f1_score=0.916]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 84:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.074, v_num=4, train_loss=0.0719, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.273, val_accuracy=0.916, val_f1_score=0.916]
Epoch 84:  90%|█████████ | 230/255 [01:34<00:10,  2.44it/s, loss=0.074, v_num=4, train_loss=0.0719, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.273, val_accuracy=0.916, val_f1_score=0.916]
Epoch 84:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.074, v_num=4, train_loss=0.0719, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.273, val_accuracy=0.916, val_f1_score=0.916]
Epoch 84:  92%|█████████▏| 234/255 [01:34<00:08,  2.47it/s, loss=0.074, v_num=4, train_loss=0.0719, train_accu

Epoch 84, global step 19209: val_loss was not in top 2


Epoch 85:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.0439, v_num=4, train_loss=0.0781, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.330, val_accuracy=0.899, val_f1_score=0.899] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 85:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.0439, v_num=4, train_loss=0.0781, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.330, val_accuracy=0.899, val_f1_score=0.899]
Epoch 85:  90%|█████████ | 230/255 [01:34<00:10,  2.44it/s, loss=0.0439, v_num=4, train_loss=0.0781, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.330, val_accuracy=0.899, val_f1_score=0.899]
Epoch 85:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.0439, v_num=4, train_loss=0.0781, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.330, val_accuracy=0.899, val_f1_score=0.899]
Epoch 85:  92%|█████████▏| 234/255 [01:34<00:08,  2.47it/s, loss=0.0439, v_num=4, train_loss=0.0781, train_

Epoch 85, global step 19435: val_loss was not in top 2


Epoch 86:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.073, v_num=4, train_loss=0.050, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.306, val_accuracy=0.918, val_f1_score=0.918]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 86:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.073, v_num=4, train_loss=0.050, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.306, val_accuracy=0.918, val_f1_score=0.918]
Epoch 86:  90%|█████████ | 230/255 [01:34<00:10,  2.44it/s, loss=0.073, v_num=4, train_loss=0.050, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.306, val_accuracy=0.918, val_f1_score=0.918]
Epoch 86:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.073, v_num=4, train_loss=0.050, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.306, val_accuracy=0.918, val_f1_score=0.918]
Epoch 86:  92%|█████████▏| 234/255 [01:34<00:08,  2.47it/s, loss=0.073, v_num=4, train_loss=0.050, train_accuracy

Epoch 86, global step 19661: val_loss was not in top 2


Epoch 87:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.0602, v_num=4, train_loss=0.00192, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.294, val_accuracy=0.919, val_f1_score=0.919]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 87:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0602, v_num=4, train_loss=0.00192, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.294, val_accuracy=0.919, val_f1_score=0.919]
Epoch 87:  90%|█████████ | 230/255 [01:34<00:10,  2.42it/s, loss=0.0602, v_num=4, train_loss=0.00192, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.294, val_accuracy=0.919, val_f1_score=0.919]
Epoch 87:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.0602, v_num=4, train_loss=0.00192, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.294, val_accuracy=0.919, val_f1_score=0.919]
Epoch 87:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.0602, v_num=4, train_loss=0.00192, tr

Epoch 87, global step 19887: val_loss was not in top 2


Epoch 88:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.0536, v_num=4, train_loss=0.0153, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.326, val_accuracy=0.914, val_f1_score=0.914] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 88:  89%|████████▉ | 228/255 [01:35<00:11,  2.40it/s, loss=0.0536, v_num=4, train_loss=0.0153, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.326, val_accuracy=0.914, val_f1_score=0.914]
Epoch 88:  90%|█████████ | 230/255 [01:35<00:10,  2.41it/s, loss=0.0536, v_num=4, train_loss=0.0153, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.326, val_accuracy=0.914, val_f1_score=0.914]
Epoch 88:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.0536, v_num=4, train_loss=0.0153, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.326, val_accuracy=0.914, val_f1_score=0.914]
Epoch 88:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.0536, v_num=4, train_loss=0.0153, train_

Epoch 88, global step 20113: val_loss was not in top 2


Epoch 89:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.0448, v_num=4, train_loss=0.0242, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.311, val_accuracy=0.916, val_f1_score=0.916] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 89:  89%|████████▉ | 228/255 [01:34<00:11,  2.40it/s, loss=0.0448, v_num=4, train_loss=0.0242, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.311, val_accuracy=0.916, val_f1_score=0.916]
Epoch 89:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.0448, v_num=4, train_loss=0.0242, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.311, val_accuracy=0.916, val_f1_score=0.916]
Epoch 89:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.0448, v_num=4, train_loss=0.0242, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.311, val_accuracy=0.916, val_f1_score=0.916]
Epoch 89:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.0448, v_num=4, train_loss=0.0242, train_

Epoch 89, global step 20339: val_loss was not in top 2


Epoch 90:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.0368, v_num=4, train_loss=0.0652, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.319, val_accuracy=0.911, val_f1_score=0.911] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 90:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0368, v_num=4, train_loss=0.0652, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.319, val_accuracy=0.911, val_f1_score=0.911]
Epoch 90:  90%|█████████ | 230/255 [01:34<00:10,  2.42it/s, loss=0.0368, v_num=4, train_loss=0.0652, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.319, val_accuracy=0.911, val_f1_score=0.911]
Epoch 90:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.0368, v_num=4, train_loss=0.0652, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.319, val_accuracy=0.911, val_f1_score=0.911]
Epoch 90:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.0368, v_num=4, train_loss=0.0652, train_

Epoch 90, global step 20565: val_loss was not in top 2


Epoch 91:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.0423, v_num=4, train_loss=0.0819, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.300, val_accuracy=0.913, val_f1_score=0.913] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 91:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.0423, v_num=4, train_loss=0.0819, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.300, val_accuracy=0.913, val_f1_score=0.913]
Epoch 91:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0423, v_num=4, train_loss=0.0819, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.300, val_accuracy=0.913, val_f1_score=0.913]
Epoch 91:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.0423, v_num=4, train_loss=0.0819, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.300, val_accuracy=0.913, val_f1_score=0.913]
Epoch 91:  92%|█████████▏| 234/255 [01:34<00:08,  2.47it/s, loss=0.0423, v_num=4, train_loss=0.0819, train_

Epoch 91, global step 20791: val_loss was not in top 2


Epoch 92:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.033, v_num=4, train_loss=0.00797, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.321, val_accuracy=0.910, val_f1_score=0.910] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 92:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.033, v_num=4, train_loss=0.00797, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.321, val_accuracy=0.910, val_f1_score=0.910]
Epoch 92:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.033, v_num=4, train_loss=0.00797, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.321, val_accuracy=0.910, val_f1_score=0.910]
Epoch 92:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.033, v_num=4, train_loss=0.00797, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.321, val_accuracy=0.910, val_f1_score=0.910]
Epoch 92:  92%|█████████▏| 234/255 [01:34<00:08,  2.46it/s, loss=0.033, v_num=4, train_loss=0.00797, train_

Epoch 92, global step 21017: val_loss was not in top 2


Epoch 93:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.0816, v_num=4, train_loss=0.0018, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.294, val_accuracy=0.913, val_f1_score=0.913] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 93:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.0816, v_num=4, train_loss=0.0018, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.294, val_accuracy=0.913, val_f1_score=0.913]
Epoch 93:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0816, v_num=4, train_loss=0.0018, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.294, val_accuracy=0.913, val_f1_score=0.913]
Epoch 93:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.0816, v_num=4, train_loss=0.0018, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.294, val_accuracy=0.913, val_f1_score=0.913]
Epoch 93:  92%|█████████▏| 234/255 [01:34<00:08,  2.47it/s, loss=0.0816, v_num=4, train_loss=0.0018, train_

Epoch 93, global step 21243: val_loss was not in top 2


Epoch 94:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.042, v_num=4, train_loss=0.0286, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.326, val_accuracy=0.908, val_f1_score=0.908]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 94:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.042, v_num=4, train_loss=0.0286, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.326, val_accuracy=0.908, val_f1_score=0.908]
Epoch 94:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.042, v_num=4, train_loss=0.0286, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.326, val_accuracy=0.908, val_f1_score=0.908]
Epoch 94:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.042, v_num=4, train_loss=0.0286, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.326, val_accuracy=0.908, val_f1_score=0.908]
Epoch 94:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.042, v_num=4, train_loss=0.0286, train_accu

Epoch 94, global step 21469: val_loss was not in top 2


Epoch 95:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.0858, v_num=4, train_loss=0.386, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.315, val_accuracy=0.915, val_f1_score=0.915]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 95:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0858, v_num=4, train_loss=0.386, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.315, val_accuracy=0.915, val_f1_score=0.915]
Epoch 95:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0858, v_num=4, train_loss=0.386, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.315, val_accuracy=0.915, val_f1_score=0.915]
Epoch 95:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.0858, v_num=4, train_loss=0.386, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.315, val_accuracy=0.915, val_f1_score=0.915]
Epoch 95:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.0858, v_num=4, train_loss=0.386, train_accu

Epoch 95, global step 21695: val_loss was not in top 2


Epoch 96:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.07, v_num=4, train_loss=0.00383, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.367, val_accuracy=0.909, val_f1_score=0.909]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 96:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.07, v_num=4, train_loss=0.00383, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.367, val_accuracy=0.909, val_f1_score=0.909]
Epoch 96:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.07, v_num=4, train_loss=0.00383, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.367, val_accuracy=0.909, val_f1_score=0.909]
Epoch 96:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.07, v_num=4, train_loss=0.00383, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.367, val_accuracy=0.909, val_f1_score=0.909]
Epoch 96:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.07, v_num=4, train_loss=0.00383, train_accu

Epoch 96, global step 21921: val_loss was not in top 2


Epoch 97:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.0707, v_num=4, train_loss=0.165, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.312, val_accuracy=0.917, val_f1_score=0.917]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 97:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.0707, v_num=4, train_loss=0.165, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.312, val_accuracy=0.917, val_f1_score=0.917]
Epoch 97:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0707, v_num=4, train_loss=0.165, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.312, val_accuracy=0.917, val_f1_score=0.917]
Epoch 97:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.0707, v_num=4, train_loss=0.165, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.312, val_accuracy=0.917, val_f1_score=0.917]
Epoch 97:  92%|█████████▏| 234/255 [01:34<00:08,  2.47it/s, loss=0.0707, v_num=4, train_loss=0.165, train_accu

Epoch 97, global step 22147: val_loss was not in top 2


Epoch 98:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.0464, v_num=4, train_loss=0.0052, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.283, val_accuracy=0.914, val_f1_score=0.914] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 98:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.0464, v_num=4, train_loss=0.0052, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.283, val_accuracy=0.914, val_f1_score=0.914]
Validating:   7%|▋         | 2/29 [00:07<01:27,  3.23s/it][A
Epoch 98:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0464, v_num=4, train_loss=0.0052, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.283, val_accuracy=0.914, val_f1_score=0.914]
Epoch 98:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.0464, v_num=4, train_loss=0.0052, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.283, val_accuracy=0.914, val_f1_score=0.914]
Epoch 98:  92%|█████████▏| 234/255 [01:34<00:

Epoch 98, global step 22373: val_loss was not in top 2


Epoch 99:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.0685, v_num=4, train_loss=0.0755, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.377, val_accuracy=0.903, val_f1_score=0.903] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 99:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.0685, v_num=4, train_loss=0.0755, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.377, val_accuracy=0.903, val_f1_score=0.903]
Epoch 99:  90%|█████████ | 230/255 [01:34<00:10,  2.44it/s, loss=0.0685, v_num=4, train_loss=0.0755, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.377, val_accuracy=0.903, val_f1_score=0.903]
Epoch 99:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.0685, v_num=4, train_loss=0.0755, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.377, val_accuracy=0.903, val_f1_score=0.903]
Epoch 99:  92%|█████████▏| 234/255 [01:34<00:08,  2.47it/s, loss=0.0685, v_num=4, train_loss=0.0755, train_

Epoch 99, global step 22599: val_loss was not in top 2


Epoch 100:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.0407, v_num=4, train_loss=0.0484, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.345, val_accuracy=0.913, val_f1_score=0.913] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 100:  89%|████████▉ | 228/255 [01:34<00:11,  2.40it/s, loss=0.0407, v_num=4, train_loss=0.0484, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.345, val_accuracy=0.913, val_f1_score=0.913]
Epoch 100:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.0407, v_num=4, train_loss=0.0484, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.345, val_accuracy=0.913, val_f1_score=0.913]
Epoch 100:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.0407, v_num=4, train_loss=0.0484, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.345, val_accuracy=0.913, val_f1_score=0.913]
Epoch 100:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.0407, v_num=4, train_loss=0.0484, t

Epoch 100, global step 22825: val_loss was not in top 2


Epoch 101:  89%|████████▊ | 226/255 [01:27<00:11,  2.58it/s, loss=0.026, v_num=4, train_loss=0.00427, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.347, val_accuracy=0.920, val_f1_score=0.920] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 101:  89%|████████▉ | 228/255 [01:35<00:11,  2.39it/s, loss=0.026, v_num=4, train_loss=0.00427, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.347, val_accuracy=0.920, val_f1_score=0.920]
Epoch 101:  90%|█████████ | 230/255 [01:35<00:10,  2.41it/s, loss=0.026, v_num=4, train_loss=0.00427, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.347, val_accuracy=0.920, val_f1_score=0.920]
Epoch 101:  91%|█████████ | 232/255 [01:35<00:09,  2.42it/s, loss=0.026, v_num=4, train_loss=0.00427, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.347, val_accuracy=0.920, val_f1_score=0.920]
Epoch 101:  92%|█████████▏| 234/255 [01:35<00:08,  2.44it/s, loss=0.026, v_num=4, train_loss=0.00427, t

Epoch 101, global step 23051: val_loss was not in top 2


Epoch 102:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.0657, v_num=4, train_loss=0.127, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.309, val_accuracy=0.917, val_f1_score=0.917]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 102:  89%|████████▉ | 228/255 [01:35<00:11,  2.40it/s, loss=0.0657, v_num=4, train_loss=0.127, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.309, val_accuracy=0.917, val_f1_score=0.917]
Epoch 102:  90%|█████████ | 230/255 [01:35<00:10,  2.41it/s, loss=0.0657, v_num=4, train_loss=0.127, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.309, val_accuracy=0.917, val_f1_score=0.917]
Epoch 102:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.0657, v_num=4, train_loss=0.127, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.309, val_accuracy=0.917, val_f1_score=0.917]
Epoch 102:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.0657, v_num=4, train_loss=0.127, train

Epoch 102, global step 23277: val_loss was not in top 2


Epoch 103:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.0358, v_num=4, train_loss=0.00194, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.297, val_accuracy=0.918, val_f1_score=0.918]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 103:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0358, v_num=4, train_loss=0.00194, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.297, val_accuracy=0.918, val_f1_score=0.918]
Epoch 103:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0358, v_num=4, train_loss=0.00194, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.297, val_accuracy=0.918, val_f1_score=0.918]
Epoch 103:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.0358, v_num=4, train_loss=0.00194, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.297, val_accuracy=0.918, val_f1_score=0.918]
Epoch 103:  92%|█████████▏| 234/255 [01:34<00:08,  2.46it/s, loss=0.0358, v_num=4, train_loss=0.0019

Epoch 103, global step 23503: val_loss was not in top 2


Epoch 104:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.0213, v_num=4, train_loss=0.00342, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.327, val_accuracy=0.918, val_f1_score=0.918]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 104:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.0213, v_num=4, train_loss=0.00342, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.327, val_accuracy=0.918, val_f1_score=0.918]
Validating:   7%|▋         | 2/29 [00:07<01:26,  3.20s/it][A
Epoch 104:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0213, v_num=4, train_loss=0.00342, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.327, val_accuracy=0.918, val_f1_score=0.918]
Epoch 104:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.0213, v_num=4, train_loss=0.00342, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.327, val_accuracy=0.918, val_f1_score=0.918]
Epoch 104:  92%|█████████▏| 234/255 [0

Epoch 104, global step 23729: val_loss was not in top 2


Epoch 105:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.0791, v_num=4, train_loss=0.0107, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.309, val_accuracy=0.924, val_f1_score=0.924] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 105:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0791, v_num=4, train_loss=0.0107, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.309, val_accuracy=0.924, val_f1_score=0.924]
Epoch 105:  90%|█████████ | 230/255 [01:34<00:10,  2.42it/s, loss=0.0791, v_num=4, train_loss=0.0107, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.309, val_accuracy=0.924, val_f1_score=0.924]
Epoch 105:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.0791, v_num=4, train_loss=0.0107, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.309, val_accuracy=0.924, val_f1_score=0.924]
Epoch 105:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.0791, v_num=4, train_loss=0.0107, t

Epoch 105, global step 23955: val_loss was not in top 2


Epoch 106:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.0214, v_num=4, train_loss=0.00469, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.389, val_accuracy=0.913, val_f1_score=0.913]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 106:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0214, v_num=4, train_loss=0.00469, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.389, val_accuracy=0.913, val_f1_score=0.913]
Epoch 106:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0214, v_num=4, train_loss=0.00469, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.389, val_accuracy=0.913, val_f1_score=0.913]
Epoch 106:  91%|█████████ | 232/255 [01:34<00:09,  2.44it/s, loss=0.0214, v_num=4, train_loss=0.00469, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.389, val_accuracy=0.913, val_f1_score=0.913]
Epoch 106:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.0214, v_num=4, train_loss=0.0046

Epoch 106, global step 24181: val_loss was not in top 2


Epoch 107:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.0754, v_num=4, train_loss=0.533, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.312, val_accuracy=0.923, val_f1_score=0.923]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 107:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0754, v_num=4, train_loss=0.533, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.312, val_accuracy=0.923, val_f1_score=0.923]
Epoch 107:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0754, v_num=4, train_loss=0.533, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.312, val_accuracy=0.923, val_f1_score=0.923]
Epoch 107:  91%|█████████ | 232/255 [01:34<00:09,  2.44it/s, loss=0.0754, v_num=4, train_loss=0.533, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.312, val_accuracy=0.923, val_f1_score=0.923]
Epoch 107:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.0754, v_num=4, train_loss=0.533, train

Epoch 107, global step 24407: val_loss was not in top 2


Epoch 108:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.0127, v_num=4, train_loss=0.0035, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.443, val_accuracy=0.909, val_f1_score=0.909]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 108:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0127, v_num=4, train_loss=0.0035, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.443, val_accuracy=0.909, val_f1_score=0.909]
Epoch 108:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0127, v_num=4, train_loss=0.0035, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.443, val_accuracy=0.909, val_f1_score=0.909]
Epoch 108:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.0127, v_num=4, train_loss=0.0035, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.443, val_accuracy=0.909, val_f1_score=0.909]
Epoch 108:  92%|█████████▏| 234/255 [01:34<00:08,  2.46it/s, loss=0.0127, v_num=4, train_loss=0.0035, 

Epoch 108, global step 24633: val_loss was not in top 2


Epoch 109:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.0249, v_num=4, train_loss=0.0276, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.340, val_accuracy=0.913, val_f1_score=0.913]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 109:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0249, v_num=4, train_loss=0.0276, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.340, val_accuracy=0.913, val_f1_score=0.913]
Epoch 109:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0249, v_num=4, train_loss=0.0276, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.340, val_accuracy=0.913, val_f1_score=0.913]
Epoch 109:  91%|█████████ | 232/255 [01:34<00:09,  2.44it/s, loss=0.0249, v_num=4, train_loss=0.0276, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.340, val_accuracy=0.913, val_f1_score=0.913]
Epoch 109:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.0249, v_num=4, train_loss=0.0276, 

Epoch 109, global step 24859: val_loss was not in top 2


Epoch 110:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.0244, v_num=4, train_loss=0.000721, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.329, val_accuracy=0.921, val_f1_score=0.921]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 110:  89%|████████▉ | 228/255 [01:34<00:11,  2.40it/s, loss=0.0244, v_num=4, train_loss=0.000721, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.329, val_accuracy=0.921, val_f1_score=0.921]
Epoch 110:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.0244, v_num=4, train_loss=0.000721, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.329, val_accuracy=0.921, val_f1_score=0.921]
Validating:  14%|█▍        | 4/29 [00:08<00:33,  1.32s/it][A
Epoch 110:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.0244, v_num=4, train_loss=0.000721, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.329, val_accuracy=0.921, val_f1_score=0.921]
Epoch 110:  92%|█████████▏| 234/25

Epoch 110, global step 25085: val_loss was not in top 2


Epoch 111:  89%|████████▊ | 226/255 [01:27<00:11,  2.60it/s, loss=0.0429, v_num=4, train_loss=0.00301, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.374, val_accuracy=0.920, val_f1_score=0.920] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 111:  89%|████████▉ | 228/255 [01:34<00:11,  2.40it/s, loss=0.0429, v_num=4, train_loss=0.00301, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.374, val_accuracy=0.920, val_f1_score=0.920]
Epoch 111:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.0429, v_num=4, train_loss=0.00301, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.374, val_accuracy=0.920, val_f1_score=0.920]
Epoch 111:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.0429, v_num=4, train_loss=0.00301, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.374, val_accuracy=0.920, val_f1_score=0.920]
Epoch 111:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.0429, v_num=4, train_loss=0.003

Epoch 111, global step 25311: val_loss was not in top 2


Epoch 112:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.0186, v_num=4, train_loss=0.0044, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.378, val_accuracy=0.911, val_f1_score=0.911] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 112:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.0186, v_num=4, train_loss=0.0044, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.378, val_accuracy=0.911, val_f1_score=0.911]
Epoch 112:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0186, v_num=4, train_loss=0.0044, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.378, val_accuracy=0.911, val_f1_score=0.911]
Epoch 112:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.0186, v_num=4, train_loss=0.0044, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.378, val_accuracy=0.911, val_f1_score=0.911]
Epoch 112:  92%|█████████▏| 234/255 [01:34<00:08,  2.47it/s, loss=0.0186, v_num=4, train_loss=0.0044, t

Epoch 112, global step 25537: val_loss was not in top 2


Epoch 113:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.0318, v_num=4, train_loss=0.00187, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.366, val_accuracy=0.917, val_f1_score=0.917] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 113:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0318, v_num=4, train_loss=0.00187, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.366, val_accuracy=0.917, val_f1_score=0.917]
Epoch 113:  90%|█████████ | 230/255 [01:34<00:10,  2.42it/s, loss=0.0318, v_num=4, train_loss=0.00187, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.366, val_accuracy=0.917, val_f1_score=0.917]
Epoch 113:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.0318, v_num=4, train_loss=0.00187, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.366, val_accuracy=0.917, val_f1_score=0.917]
Epoch 113:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.0318, v_num=4, train_loss=0.001

Epoch 113, global step 25763: val_loss was not in top 2


Epoch 114:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.0554, v_num=4, train_loss=0.00424, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.347, val_accuracy=0.918, val_f1_score=0.918]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 114:  89%|████████▉ | 228/255 [01:35<00:11,  2.40it/s, loss=0.0554, v_num=4, train_loss=0.00424, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.347, val_accuracy=0.918, val_f1_score=0.918]
Epoch 114:  90%|█████████ | 230/255 [01:35<00:10,  2.41it/s, loss=0.0554, v_num=4, train_loss=0.00424, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.347, val_accuracy=0.918, val_f1_score=0.918]
Epoch 114:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.0554, v_num=4, train_loss=0.00424, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.347, val_accuracy=0.918, val_f1_score=0.918]
Epoch 114:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.0554, v_num=4, train_loss=0.0042

Epoch 114, global step 25989: val_loss was not in top 2


Epoch 115:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.021, v_num=4, train_loss=0.0142, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.312, val_accuracy=0.925, val_f1_score=0.925]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 115:  89%|████████▉ | 228/255 [01:35<00:11,  2.40it/s, loss=0.021, v_num=4, train_loss=0.0142, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.312, val_accuracy=0.925, val_f1_score=0.925]
Epoch 115:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.021, v_num=4, train_loss=0.0142, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.312, val_accuracy=0.925, val_f1_score=0.925]
Validating:  14%|█▍        | 4/29 [00:08<00:32,  1.31s/it][A
Epoch 115:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.021, v_num=4, train_loss=0.0142, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.312, val_accuracy=0.925, val_f1_score=0.925]
Epoch 115:  92%|█████████▏| 234/255 [01:35<

Epoch 115, global step 26215: val_loss was not in top 2


Epoch 116:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.0448, v_num=4, train_loss=0.00197, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.930, val_f1_score=0.930]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 116:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0448, v_num=4, train_loss=0.00197, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.930, val_f1_score=0.930]
Epoch 116:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0448, v_num=4, train_loss=0.00197, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.930, val_f1_score=0.930]
Epoch 116:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.0448, v_num=4, train_loss=0.00197, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.930, val_f1_score=0.930]
Epoch 116:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.0448, v_num=4, train_loss=0.0019

Epoch 116, global step 26441: val_loss was not in top 2


Epoch 117:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.0598, v_num=4, train_loss=0.0138, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.306, val_accuracy=0.930, val_f1_score=0.930] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 117:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.0598, v_num=4, train_loss=0.0138, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.306, val_accuracy=0.930, val_f1_score=0.930]
Epoch 117:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0598, v_num=4, train_loss=0.0138, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.306, val_accuracy=0.930, val_f1_score=0.930]
Epoch 117:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.0598, v_num=4, train_loss=0.0138, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.306, val_accuracy=0.930, val_f1_score=0.930]
Epoch 117:  92%|█████████▏| 234/255 [01:34<00:08,  2.46it/s, loss=0.0598, v_num=4, train_loss=0.0138, t

Epoch 117, global step 26667: val_loss was not in top 2


Epoch 118:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.0618, v_num=4, train_loss=0.0244, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.358, val_accuracy=0.921, val_f1_score=0.921] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 118:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0618, v_num=4, train_loss=0.0244, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.358, val_accuracy=0.921, val_f1_score=0.921]
Epoch 118:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0618, v_num=4, train_loss=0.0244, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.358, val_accuracy=0.921, val_f1_score=0.921]
Epoch 118:  91%|█████████ | 232/255 [01:34<00:09,  2.44it/s, loss=0.0618, v_num=4, train_loss=0.0244, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.358, val_accuracy=0.921, val_f1_score=0.921]
Epoch 118:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.0618, v_num=4, train_loss=0.0244, t

Epoch 118, global step 26893: val_loss was not in top 2


Epoch 119:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.0504, v_num=4, train_loss=0.266, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.334, val_accuracy=0.924, val_f1_score=0.924]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 119:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0504, v_num=4, train_loss=0.266, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.334, val_accuracy=0.924, val_f1_score=0.924]
Epoch 119:  90%|█████████ | 230/255 [01:34<00:10,  2.42it/s, loss=0.0504, v_num=4, train_loss=0.266, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.334, val_accuracy=0.924, val_f1_score=0.924]
Epoch 119:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.0504, v_num=4, train_loss=0.266, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.334, val_accuracy=0.924, val_f1_score=0.924]
Epoch 119:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.0504, v_num=4, train_loss=0.266, train

Epoch 119, global step 27119: val_loss was not in top 2


Epoch 120:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.0345, v_num=4, train_loss=0.0112, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.354, val_accuracy=0.918, val_f1_score=0.918] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 120:  89%|████████▉ | 228/255 [01:34<00:11,  2.40it/s, loss=0.0345, v_num=4, train_loss=0.0112, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.354, val_accuracy=0.918, val_f1_score=0.918]
Epoch 120:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.0345, v_num=4, train_loss=0.0112, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.354, val_accuracy=0.918, val_f1_score=0.918]
Epoch 120:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.0345, v_num=4, train_loss=0.0112, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.354, val_accuracy=0.918, val_f1_score=0.918]
Epoch 120:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.0345, v_num=4, train_loss=0.0112, t

Epoch 120, global step 27345: val_loss was not in top 2


Epoch 121:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.022, v_num=4, train_loss=0.00652, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.295, val_accuracy=0.923, val_f1_score=0.923] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 121:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.022, v_num=4, train_loss=0.00652, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.295, val_accuracy=0.923, val_f1_score=0.923]
Epoch 121:  90%|█████████ | 230/255 [01:34<00:10,  2.42it/s, loss=0.022, v_num=4, train_loss=0.00652, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.295, val_accuracy=0.923, val_f1_score=0.923]
Epoch 121:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.022, v_num=4, train_loss=0.00652, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.295, val_accuracy=0.923, val_f1_score=0.923]
Validating:  21%|██        | 6/29 [00:08<00:17,  1.32it/s][A
Epoch 121:  92%|█████████▏| 234/255 [01:3

Epoch 121, global step 27571: val_loss was not in top 2


Epoch 122:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.00966, v_num=4, train_loss=0.0313, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.275, val_accuracy=0.928, val_f1_score=0.928] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 122:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.00966, v_num=4, train_loss=0.0313, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.275, val_accuracy=0.928, val_f1_score=0.928]
Epoch 122:  90%|█████████ | 230/255 [01:34<00:10,  2.42it/s, loss=0.00966, v_num=4, train_loss=0.0313, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.275, val_accuracy=0.928, val_f1_score=0.928]
Epoch 122:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.00966, v_num=4, train_loss=0.0313, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.275, val_accuracy=0.928, val_f1_score=0.928]
Epoch 122:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.00966, v_num=4, train_loss=0.03

Epoch 122, global step 27797: val_loss was not in top 2


Epoch 123:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.0254, v_num=4, train_loss=0.0397, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.279, val_accuracy=0.930, val_f1_score=0.930]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 123:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0254, v_num=4, train_loss=0.0397, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.279, val_accuracy=0.930, val_f1_score=0.930]
Epoch 123:  90%|█████████ | 230/255 [01:34<00:10,  2.42it/s, loss=0.0254, v_num=4, train_loss=0.0397, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.279, val_accuracy=0.930, val_f1_score=0.930]
Epoch 123:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.0254, v_num=4, train_loss=0.0397, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.279, val_accuracy=0.930, val_f1_score=0.930]
Epoch 123:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.0254, v_num=4, train_loss=0.0397,

Epoch 123, global step 28023: val_loss was not in top 2


Epoch 124:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.024, v_num=4, train_loss=0.00118, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.323, val_accuracy=0.923, val_f1_score=0.923]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 124:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.024, v_num=4, train_loss=0.00118, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.323, val_accuracy=0.923, val_f1_score=0.923]
Epoch 124:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.024, v_num=4, train_loss=0.00118, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.323, val_accuracy=0.923, val_f1_score=0.923]
Epoch 124:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.024, v_num=4, train_loss=0.00118, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.323, val_accuracy=0.923, val_f1_score=0.923]
Epoch 124:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.024, v_num=4, train_loss=0.00118, 

Epoch 124, global step 28249: val_loss was not in top 2


Epoch 125:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.024, v_num=4, train_loss=0.0582, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.293, val_accuracy=0.933, val_f1_score=0.933]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 125:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.024, v_num=4, train_loss=0.0582, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.293, val_accuracy=0.933, val_f1_score=0.933]
Epoch 125:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.024, v_num=4, train_loss=0.0582, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.293, val_accuracy=0.933, val_f1_score=0.933]
Epoch 125:  91%|█████████ | 232/255 [01:34<00:09,  2.44it/s, loss=0.024, v_num=4, train_loss=0.0582, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.293, val_accuracy=0.933, val_f1_score=0.933]
Epoch 125:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.024, v_num=4, train_loss=0.0582, train

Epoch 125, global step 28475: val_loss reached 0.24981 (best 0.24981), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v2.ckpt" as top 2


Epoch 126:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.0425, v_num=4, train_loss=0.00188, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.250, val_accuracy=0.929, val_f1_score=0.929] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 126:  89%|████████▉ | 228/255 [01:34<00:11,  2.40it/s, loss=0.0425, v_num=4, train_loss=0.00188, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.250, val_accuracy=0.929, val_f1_score=0.929]
Epoch 126:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.0425, v_num=4, train_loss=0.00188, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.250, val_accuracy=0.929, val_f1_score=0.929]
Epoch 126:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.0425, v_num=4, train_loss=0.00188, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.250, val_accuracy=0.929, val_f1_score=0.929]
Epoch 126:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.0425, v_num=4, train_loss=0.001

Epoch 126, global step 28701: val_loss was not in top 2


Epoch 127:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.0265, v_num=4, train_loss=0.00441, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.929, val_f1_score=0.929]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 127:  89%|████████▉ | 228/255 [01:35<00:11,  2.40it/s, loss=0.0265, v_num=4, train_loss=0.00441, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.929, val_f1_score=0.929]
Epoch 127:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.0265, v_num=4, train_loss=0.00441, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.929, val_f1_score=0.929]
Epoch 127:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.0265, v_num=4, train_loss=0.00441, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.929, val_f1_score=0.929]
Epoch 127:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.0265, v_num=4, train_loss=0.0044

Epoch 127, global step 28927: val_loss was not in top 2


Epoch 128:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.0315, v_num=4, train_loss=0.00104, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.284, val_accuracy=0.931, val_f1_score=0.931] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 128:  89%|████████▉ | 228/255 [01:34<00:11,  2.40it/s, loss=0.0315, v_num=4, train_loss=0.00104, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.284, val_accuracy=0.931, val_f1_score=0.931]
Epoch 128:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.0315, v_num=4, train_loss=0.00104, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.284, val_accuracy=0.931, val_f1_score=0.931]
Epoch 128:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.0315, v_num=4, train_loss=0.00104, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.284, val_accuracy=0.931, val_f1_score=0.931]
Epoch 128:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.0315, v_num=4, train_loss=0.001

Epoch 128, global step 29153: val_loss was not in top 2


Epoch 129:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.0138, v_num=4, train_loss=0.000992, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.301, val_accuracy=0.932, val_f1_score=0.932]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 129:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.0138, v_num=4, train_loss=0.000992, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.301, val_accuracy=0.932, val_f1_score=0.932]
Epoch 129:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0138, v_num=4, train_loss=0.000992, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.301, val_accuracy=0.932, val_f1_score=0.932]
Epoch 129:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.0138, v_num=4, train_loss=0.000992, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.301, val_accuracy=0.932, val_f1_score=0.932]
Epoch 129:  92%|█████████▏| 234/255 [01:34<00:08,  2.47it/s, loss=0.0138, v_num=4, train_loss=0.

Epoch 129, global step 29379: val_loss was not in top 2


Epoch 130:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.0445, v_num=4, train_loss=0.0334, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.287, val_accuracy=0.925, val_f1_score=0.925]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 130:  89%|████████▉ | 228/255 [01:34<00:11,  2.43it/s, loss=0.0445, v_num=4, train_loss=0.0334, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.287, val_accuracy=0.925, val_f1_score=0.925]
Epoch 130:  90%|█████████ | 230/255 [01:34<00:10,  2.44it/s, loss=0.0445, v_num=4, train_loss=0.0334, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.287, val_accuracy=0.925, val_f1_score=0.925]
Epoch 130:  91%|█████████ | 232/255 [01:34<00:09,  2.46it/s, loss=0.0445, v_num=4, train_loss=0.0334, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.287, val_accuracy=0.925, val_f1_score=0.925]
Epoch 130:  92%|█████████▏| 234/255 [01:34<00:08,  2.47it/s, loss=0.0445, v_num=4, train_loss=0.0334, 

Epoch 130, global step 29605: val_loss was not in top 2


Epoch 131:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.082, v_num=4, train_loss=0.0117, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.318, val_accuracy=0.925, val_f1_score=0.925]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 131:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.082, v_num=4, train_loss=0.0117, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.318, val_accuracy=0.925, val_f1_score=0.925]
Epoch 131:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.082, v_num=4, train_loss=0.0117, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.318, val_accuracy=0.925, val_f1_score=0.925]
Epoch 131:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.082, v_num=4, train_loss=0.0117, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.318, val_accuracy=0.925, val_f1_score=0.925]
Epoch 131:  92%|█████████▏| 234/255 [01:34<00:08,  2.46it/s, loss=0.082, v_num=4, train_loss=0.0117, trai

Epoch 131, global step 29831: val_loss was not in top 2


Epoch 132:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.0282, v_num=4, train_loss=0.00895, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.468, val_accuracy=0.891, val_f1_score=0.891]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 132:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0282, v_num=4, train_loss=0.00895, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.468, val_accuracy=0.891, val_f1_score=0.891]
Epoch 132:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0282, v_num=4, train_loss=0.00895, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.468, val_accuracy=0.891, val_f1_score=0.891]
Epoch 132:  91%|█████████ | 232/255 [01:34<00:09,  2.44it/s, loss=0.0282, v_num=4, train_loss=0.00895, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.468, val_accuracy=0.891, val_f1_score=0.891]
Validating:  21%|██        | 6/29 [00:08<00:16,  1.41it/s][A
Epoch 132:  92%|█████████▏| 234/255 [0

Epoch 132, global step 30057: val_loss reached 0.25823 (best 0.24981), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v3.ckpt" as top 2


Epoch 133:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.18, v_num=4, train_loss=0.163, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.258, val_accuracy=0.936, val_f1_score=0.936]    
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 133:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.18, v_num=4, train_loss=0.163, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.258, val_accuracy=0.936, val_f1_score=0.936]
Epoch 133:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.18, v_num=4, train_loss=0.163, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.258, val_accuracy=0.936, val_f1_score=0.936]
Epoch 133:  91%|█████████ | 232/255 [01:34<00:09,  2.44it/s, loss=0.18, v_num=4, train_loss=0.163, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.258, val_accuracy=0.936, val_f1_score=0.936]
Epoch 133:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.18, v_num=4, train_loss=0.163, train_accurac

Epoch 133, global step 30283: val_loss was not in top 2


Epoch 134:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.063, v_num=4, train_loss=0.0134, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.409, val_accuracy=0.904, val_f1_score=0.904]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 134:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.063, v_num=4, train_loss=0.0134, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.409, val_accuracy=0.904, val_f1_score=0.904]
Epoch 134:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.063, v_num=4, train_loss=0.0134, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.409, val_accuracy=0.904, val_f1_score=0.904]
Epoch 134:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.063, v_num=4, train_loss=0.0134, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.409, val_accuracy=0.904, val_f1_score=0.904]
Epoch 134:  92%|█████████▏| 234/255 [01:34<00:08,  2.47it/s, loss=0.063, v_num=4, train_loss=0.0134, train

Epoch 134, global step 30509: val_loss was not in top 2


Epoch 135:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.0566, v_num=4, train_loss=0.00495, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.294, val_accuracy=0.923, val_f1_score=0.923]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 135:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0566, v_num=4, train_loss=0.00495, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.294, val_accuracy=0.923, val_f1_score=0.923]
Epoch 135:  90%|█████████ | 230/255 [01:34<00:10,  2.42it/s, loss=0.0566, v_num=4, train_loss=0.00495, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.294, val_accuracy=0.923, val_f1_score=0.923]
Epoch 135:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.0566, v_num=4, train_loss=0.00495, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.294, val_accuracy=0.923, val_f1_score=0.923]
Epoch 135:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.0566, v_num=4, train_loss=0.0049

Epoch 135, global step 30735: val_loss was not in top 2


Epoch 136:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.04, v_num=4, train_loss=0.032, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.261, val_accuracy=0.924, val_f1_score=0.924]    
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 136:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.04, v_num=4, train_loss=0.032, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.261, val_accuracy=0.924, val_f1_score=0.924]
Epoch 136:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.04, v_num=4, train_loss=0.032, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.261, val_accuracy=0.924, val_f1_score=0.924]
Epoch 136:  91%|█████████ | 232/255 [01:34<00:09,  2.44it/s, loss=0.04, v_num=4, train_loss=0.032, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.261, val_accuracy=0.924, val_f1_score=0.924]
Epoch 136:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.04, v_num=4, train_loss=0.032, train_accurac

Epoch 136, global step 30961: val_loss was not in top 2


Epoch 137:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.014, v_num=4, train_loss=0.00165, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.268, val_accuracy=0.930, val_f1_score=0.930] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 137:  89%|████████▉ | 228/255 [01:35<00:11,  2.39it/s, loss=0.014, v_num=4, train_loss=0.00165, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.268, val_accuracy=0.930, val_f1_score=0.930]
Epoch 137:  90%|█████████ | 230/255 [01:35<00:10,  2.41it/s, loss=0.014, v_num=4, train_loss=0.00165, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.268, val_accuracy=0.930, val_f1_score=0.930]
Epoch 137:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.014, v_num=4, train_loss=0.00165, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.268, val_accuracy=0.930, val_f1_score=0.930]
Epoch 137:  92%|█████████▏| 234/255 [01:35<00:08,  2.44it/s, loss=0.014, v_num=4, train_loss=0.00165, t

Epoch 137, global step 31187: val_loss was not in top 2


Epoch 138:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.0298, v_num=4, train_loss=0.0017, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.279, val_accuracy=0.927, val_f1_score=0.927]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 138:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0298, v_num=4, train_loss=0.0017, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.279, val_accuracy=0.927, val_f1_score=0.927]
Epoch 138:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0298, v_num=4, train_loss=0.0017, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.279, val_accuracy=0.927, val_f1_score=0.927]
Validating:  14%|█▍        | 4/29 [00:07<00:31,  1.25s/it][A
Epoch 138:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.0298, v_num=4, train_loss=0.0017, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.279, val_accuracy=0.927, val_f1_score=0.927]
Epoch 138:  92%|█████████▏| 234/255 [01:

Epoch 138, global step 31413: val_loss was not in top 2


Epoch 139:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.0137, v_num=4, train_loss=0.00164, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.329, val_accuracy=0.928, val_f1_score=0.928]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 139:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0137, v_num=4, train_loss=0.00164, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.329, val_accuracy=0.928, val_f1_score=0.928]
Epoch 139:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0137, v_num=4, train_loss=0.00164, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.329, val_accuracy=0.928, val_f1_score=0.928]
Epoch 139:  91%|█████████ | 232/255 [01:34<00:09,  2.44it/s, loss=0.0137, v_num=4, train_loss=0.00164, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.329, val_accuracy=0.928, val_f1_score=0.928]
Epoch 139:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.0137, v_num=4, train_loss=0.0016

Epoch 139, global step 31639: val_loss was not in top 2


Epoch 140:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.0415, v_num=4, train_loss=0.220, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.287, val_accuracy=0.933, val_f1_score=0.933]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 140:  89%|████████▉ | 228/255 [01:35<00:11,  2.40it/s, loss=0.0415, v_num=4, train_loss=0.220, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.287, val_accuracy=0.933, val_f1_score=0.933]
Epoch 140:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.0415, v_num=4, train_loss=0.220, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.287, val_accuracy=0.933, val_f1_score=0.933]
Epoch 140:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.0415, v_num=4, train_loss=0.220, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.287, val_accuracy=0.933, val_f1_score=0.933]
Epoch 140:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.0415, v_num=4, train_loss=0.220, trai

Epoch 140, global step 31865: val_loss was not in top 2


Epoch 141:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.0125, v_num=4, train_loss=0.000439, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.307, val_accuracy=0.923, val_f1_score=0.923]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 141:  89%|████████▉ | 228/255 [01:35<00:11,  2.40it/s, loss=0.0125, v_num=4, train_loss=0.000439, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.307, val_accuracy=0.923, val_f1_score=0.923]
Validating:   7%|▋         | 2/29 [00:07<01:29,  3.30s/it][A
Epoch 141:  90%|█████████ | 230/255 [01:35<00:10,  2.41it/s, loss=0.0125, v_num=4, train_loss=0.000439, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.307, val_accuracy=0.923, val_f1_score=0.923]
Epoch 141:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.0125, v_num=4, train_loss=0.000439, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.307, val_accuracy=0.923, val_f1_score=0.923]
Epoch 141:  92%|█████████▏| 234/25

Epoch 141, global step 32091: val_loss was not in top 2


Epoch 142:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.0285, v_num=4, train_loss=0.0269, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.930, val_f1_score=0.930]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 142:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0285, v_num=4, train_loss=0.0269, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.930, val_f1_score=0.930]
Epoch 142:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0285, v_num=4, train_loss=0.0269, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.930, val_f1_score=0.930]
Epoch 142:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.0285, v_num=4, train_loss=0.0269, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.930, val_f1_score=0.930]
Epoch 142:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.0285, v_num=4, train_loss=0.0269, 

Epoch 142, global step 32317: val_loss was not in top 2


Epoch 143:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.0214, v_num=4, train_loss=0.00961, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.266, val_accuracy=0.933, val_f1_score=0.933] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 143:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.0214, v_num=4, train_loss=0.00961, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.266, val_accuracy=0.933, val_f1_score=0.933]
Validating:   7%|▋         | 2/29 [00:07<01:26,  3.19s/it][A
Epoch 143:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0214, v_num=4, train_loss=0.00961, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.266, val_accuracy=0.933, val_f1_score=0.933]
Epoch 143:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.0214, v_num=4, train_loss=0.00961, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.266, val_accuracy=0.933, val_f1_score=0.933]
Epoch 143:  92%|█████████▏| 234/255 [

Epoch 143, global step 32543: val_loss was not in top 2


Epoch 144:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.00775, v_num=4, train_loss=0.00249, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.302, val_accuracy=0.928, val_f1_score=0.928]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 144:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.00775, v_num=4, train_loss=0.00249, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.302, val_accuracy=0.928, val_f1_score=0.928]
Epoch 144:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.00775, v_num=4, train_loss=0.00249, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.302, val_accuracy=0.928, val_f1_score=0.928]
Epoch 144:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.00775, v_num=4, train_loss=0.00249, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.302, val_accuracy=0.928, val_f1_score=0.928]
Epoch 144:  92%|█████████▏| 234/255 [01:34<00:08,  2.47it/s, loss=0.00775, v_num=4, train_loss=0

Epoch 144, global step 32769: val_loss was not in top 2


Epoch 145:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.0227, v_num=4, train_loss=0.00872, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.269, val_accuracy=0.935, val_f1_score=0.935] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 145:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0227, v_num=4, train_loss=0.00872, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.269, val_accuracy=0.935, val_f1_score=0.935]
Epoch 145:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0227, v_num=4, train_loss=0.00872, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.269, val_accuracy=0.935, val_f1_score=0.935]
Epoch 145:  91%|█████████ | 232/255 [01:34<00:09,  2.44it/s, loss=0.0227, v_num=4, train_loss=0.00872, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.269, val_accuracy=0.935, val_f1_score=0.935]
Epoch 145:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.0227, v_num=4, train_loss=0.008

Epoch 145, global step 32995: val_loss reached 0.24510 (best 0.24510), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v3.ckpt" as top 2


Epoch 146:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.192, v_num=4, train_loss=0.0184, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.245, val_accuracy=0.938, val_f1_score=0.938]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 146:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.192, v_num=4, train_loss=0.0184, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.245, val_accuracy=0.938, val_f1_score=0.938]
Epoch 146:  90%|█████████ | 230/255 [01:34<00:10,  2.42it/s, loss=0.192, v_num=4, train_loss=0.0184, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.245, val_accuracy=0.938, val_f1_score=0.938]
Epoch 146:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.192, v_num=4, train_loss=0.0184, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.245, val_accuracy=0.938, val_f1_score=0.938]
Epoch 146:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.192, v_num=4, train_loss=0.0184, train

Epoch 146, global step 33221: val_loss was not in top 2


Epoch 147:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.0607, v_num=4, train_loss=0.0372, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.325, val_accuracy=0.884, val_f1_score=0.884]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 147:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0607, v_num=4, train_loss=0.0372, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.325, val_accuracy=0.884, val_f1_score=0.884]
Epoch 147:  90%|█████████ | 230/255 [01:34<00:10,  2.42it/s, loss=0.0607, v_num=4, train_loss=0.0372, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.325, val_accuracy=0.884, val_f1_score=0.884]
Epoch 147:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.0607, v_num=4, train_loss=0.0372, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.325, val_accuracy=0.884, val_f1_score=0.884]
Epoch 147:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.0607, v_num=4, train_loss=0.0372, tr

Epoch 147, global step 33447: val_loss was not in top 2


Epoch 148:  89%|████████▊ | 226/255 [01:27<00:11,  2.60it/s, loss=0.0414, v_num=4, train_loss=0.260, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.252, val_accuracy=0.916, val_f1_score=0.916]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 148:  89%|████████▉ | 228/255 [01:34<00:11,  2.40it/s, loss=0.0414, v_num=4, train_loss=0.260, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.252, val_accuracy=0.916, val_f1_score=0.916]
Epoch 148:  90%|█████████ | 230/255 [01:35<00:10,  2.42it/s, loss=0.0414, v_num=4, train_loss=0.260, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.252, val_accuracy=0.916, val_f1_score=0.916]
Epoch 148:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.0414, v_num=4, train_loss=0.260, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.252, val_accuracy=0.916, val_f1_score=0.916]
Epoch 148:  92%|█████████▏| 234/255 [01:35<00:08,  2.45it/s, loss=0.0414, v_num=4, train_loss=0.260, train

Epoch 148, global step 33673: val_loss was not in top 2


Epoch 149:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.0415, v_num=4, train_loss=0.0299, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.283, val_accuracy=0.923, val_f1_score=0.923] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 149:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.0415, v_num=4, train_loss=0.0299, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.283, val_accuracy=0.923, val_f1_score=0.923]
Epoch 149:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0415, v_num=4, train_loss=0.0299, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.283, val_accuracy=0.923, val_f1_score=0.923]
Epoch 149:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.0415, v_num=4, train_loss=0.0299, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.283, val_accuracy=0.923, val_f1_score=0.923]
Epoch 149:  92%|█████████▏| 234/255 [01:34<00:08,  2.46it/s, loss=0.0415, v_num=4, train_loss=0.0299, t

Epoch 149, global step 33899: val_loss reached 0.23288 (best 0.23288), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v2.ckpt" as top 2


Epoch 150:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.0441, v_num=4, train_loss=0.00181, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.233, val_accuracy=0.929, val_f1_score=0.929] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 150:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0441, v_num=4, train_loss=0.00181, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.233, val_accuracy=0.929, val_f1_score=0.929]
Epoch 150:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0441, v_num=4, train_loss=0.00181, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.233, val_accuracy=0.929, val_f1_score=0.929]
Epoch 150:  91%|█████████ | 232/255 [01:34<00:09,  2.44it/s, loss=0.0441, v_num=4, train_loss=0.00181, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.233, val_accuracy=0.929, val_f1_score=0.929]
Epoch 150:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.0441, v_num=4, train_loss=0.001

Epoch 150, global step 34125: val_loss was not in top 2


Epoch 151:  89%|████████▊ | 226/255 [01:26<00:11,  2.60it/s, loss=0.0307, v_num=4, train_loss=0.0021, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.293, val_accuracy=0.927, val_f1_score=0.927] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 151:  89%|████████▉ | 228/255 [01:34<00:11,  2.41it/s, loss=0.0307, v_num=4, train_loss=0.0021, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.293, val_accuracy=0.927, val_f1_score=0.927]
Epoch 151:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0307, v_num=4, train_loss=0.0021, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.293, val_accuracy=0.927, val_f1_score=0.927]
Epoch 151:  91%|█████████ | 232/255 [01:35<00:09,  2.44it/s, loss=0.0307, v_num=4, train_loss=0.0021, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.293, val_accuracy=0.927, val_f1_score=0.927]
Epoch 151:  92%|█████████▏| 234/255 [01:35<00:08,  2.46it/s, loss=0.0307, v_num=4, train_loss=0.0021, t

Epoch 151, global step 34351: val_loss was not in top 2


Epoch 152:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.0528, v_num=4, train_loss=0.00548, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.303, val_accuracy=0.926, val_f1_score=0.926]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 152:  89%|████████▉ | 228/255 [01:34<00:11,  2.42it/s, loss=0.0528, v_num=4, train_loss=0.00548, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.303, val_accuracy=0.926, val_f1_score=0.926]
Epoch 152:  90%|█████████ | 230/255 [01:34<00:10,  2.43it/s, loss=0.0528, v_num=4, train_loss=0.00548, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.303, val_accuracy=0.926, val_f1_score=0.926]
Epoch 152:  91%|█████████ | 232/255 [01:34<00:09,  2.45it/s, loss=0.0528, v_num=4, train_loss=0.00548, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.303, val_accuracy=0.926, val_f1_score=0.926]
Epoch 152:  92%|█████████▏| 234/255 [01:34<00:08,  2.47it/s, loss=0.0528, v_num=4, train_loss=0.0054

Epoch 152, global step 34577: val_loss reached 0.24091 (best 0.23288), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v3.ckpt" as top 2


Epoch 153:  89%|████████▊ | 226/255 [01:27<00:11,  2.59it/s, loss=0.0273, v_num=4, train_loss=0.00252, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.241, val_accuracy=0.930, val_f1_score=0.930]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 153:  89%|████████▉ | 228/255 [01:35<00:11,  2.39it/s, loss=0.0273, v_num=4, train_loss=0.00252, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.241, val_accuracy=0.930, val_f1_score=0.930]
Epoch 153:  90%|█████████ | 230/255 [01:35<00:10,  2.41it/s, loss=0.0273, v_num=4, train_loss=0.00252, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.241, val_accuracy=0.930, val_f1_score=0.930]
Epoch 153:  91%|█████████ | 232/255 [01:35<00:09,  2.43it/s, loss=0.0273, v_num=4, train_loss=0.00252, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.241, val_accuracy=0.930, val_f1_score=0.930]
Epoch 153:  92%|█████████▏| 234/255 [01:35<00:08,  2.44it/s, loss=0.0273, v_num=4, train_loss=0.0025

Epoch 153, global step 34803: val_loss reached 0.23569 (best 0.23288), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v3.ckpt" as top 2


Epoch 154:  89%|████████▊ | 226/255 [01:27<00:11,  2.58it/s, loss=0.0399, v_num=4, train_loss=0.0267, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.236, val_accuracy=0.920, val_f1_score=0.920] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 154:  89%|████████▉ | 228/255 [01:35<00:11,  2.39it/s, loss=0.0399, v_num=4, train_loss=0.0267, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.236, val_accuracy=0.920, val_f1_score=0.920]
Epoch 154:  90%|█████████ | 230/255 [01:35<00:10,  2.41it/s, loss=0.0399, v_num=4, train_loss=0.0267, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.236, val_accuracy=0.920, val_f1_score=0.920]
Epoch 154:  91%|█████████ | 232/255 [01:35<00:09,  2.42it/s, loss=0.0399, v_num=4, train_loss=0.0267, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.236, val_accuracy=0.920, val_f1_score=0.920]
Epoch 154:  92%|█████████▏| 234/255 [01:35<00:08,  2.44it/s, loss=0.0399, v_num=4, train_loss=0.0267, t

Epoch 154, global step 35029: val_loss reached 0.20454 (best 0.20454), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-0-v3.ckpt" as top 2


Epoch 155:  89%|████████▊ | 226/255 [01:26<00:11,  2.61it/s, loss=0.0205, v_num=4, train_loss=0.0676, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.205, val_accuracy=0.932, val_f1_score=0.932] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A

OSError: [Errno 12] Cannot allocate memory

Epoch 155:  89%|████████▉ | 227/255 [01:37<00:12,  2.33it/s, loss=0.0205, v_num=4, train_loss=0.0676, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.205, val_accuracy=0.932, val_f1_score=0.932]

## Load Checkpoint 

In [None]:
# best-checkpoint-corr-3-v1.ckptn
# trainer.fit(model, data_module, ckpt_path="/Workspace/code/checkpoints/best-checkpoint-corr-3-v1.ckpt")