In [1]:
import os
import pandas as pd
import numpy as np
from sklearn.preprocessing import LabelEncoder
from sklearn.model_selection import train_test_split
from sklearn.metrics import classification_report, confusion_matrix
import matplotlib.pyplot as plt

import torch
from torch import nn, optim
from torch.nn import functional as F
from torch.utils.data import Dataset, DataLoader

import torchmetrics
from torchmetrics.functional import accuracy

import pytorch_lightning as pl
from pytorch_lightning.loggers import TensorBoardLogger
from pytorch_lightning.callbacks import ModelCheckpoint

device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
print(device)

cuda


## Model Setup 

In [2]:
pl.seed_everything(42, workers=True)

class DrowsyDataset(Dataset):
    
    def __init__(self, sequences):
        self.sequences = sequences
        
    def __len__(self):
        return len(self.sequences)
    
    def __getitem__(self, idx):
        sequence, label = self.sequences[idx]
        return dict(
            sequence=torch.Tensor(sequence.to_numpy()),
            label=torch.tensor(label).long()
        )
    
class DrowsyDataModule(pl.LightningDataModule):
    
    def __init__(self, train_sequences, val_sequences, test_sequences, batch_size):
        super().__init__()
        self.train_sequences = train_sequences
        self.val_sequences = val_sequences
        self.test_sequences = test_sequences
        self.batch_size = batch_size

    def setup(self, stage=None):
        self.train_dataset = DrowsyDataset(self.train_sequences)
        self.val_dataset = DrowsyDataset(self.val_sequences)
        self.test_dataset = DrowsyDataset(self.test_sequences)
        
    def train_dataloader(self):
        return DataLoader(
            self.train_dataset,
            batch_size=self.batch_size,
            shuffle=True,
            num_workers=os.cpu_count()
        )
    
    def val_dataloader(self):
        return DataLoader(
            self.val_dataset,
            batch_size=self.batch_size,
            shuffle=False,
            num_workers=os.cpu_count()
        )
    
    def test_dataloader(self):
        return DataLoader(
            self.test_dataset,
            batch_size=self.batch_size,
            shuffle=False,
            num_workers=os.cpu_count()
        ) 

class DrowsyModel(nn.Module):
    
    def __init__(self, n_features, n_classes, n_hidden=256, n_layers=3):
        super().__init__()
        
        self.n_hidden = n_hidden
        
        self.lstm = nn.LSTM(
            input_size=n_features,
            hidden_size=n_hidden,
            num_layers=n_layers,
            batch_first=True,
            dropout=0.75
        )
        
        self.classifier = nn.Linear(n_hidden, n_classes)
        
    def forward(self, x):
        self.lstm.flatten_parameters()
        _, (hidden, _) = self.lstm(x)
        
        out = hidden[-1]
        return self.classifier(out)
    
class DrowsyPredictor(pl.LightningModule):
    
    def __init__(self, n_features: int, n_classes: int):
        super().__init__()
        self.model = DrowsyModel(n_features, n_classes)
        self.criterion = nn.CrossEntropyLoss()
        
    def forward(self, x, label=None):
        output = self.model(x)
        loss = 0
        if label is not None:
            loss = self.criterion(output, label)
        return loss, output
        
    def training_step(self, batch, batch_idx):
        sequences = batch["sequence"]
        labels = batch["label"]
        loss, outputs = self(sequences, labels)
        predictions = torch.argmax(outputs, dim=1)
        step_accuracy = accuracy(predictions, labels)
        
        self.log("train_loss", loss, prog_bar=True, logger=True)
        self.log("train_accuracy", step_accuracy, prog_bar=True, logger=True)
        
        return {"loss": loss, "accuracy": step_accuracy}
    
    def validation_step(self, batch, batch_idx):
        sequences = batch["sequence"]
        labels = batch["label"]
        loss, outputs = self(sequences, labels)
        predictions = torch.argmax(outputs, dim=1)
        step_accuracy = accuracy(predictions, labels)
        
        self.log("val_loss", loss, prog_bar=True, logger=True)
        self.log("val_accuracy", step_accuracy, prog_bar=True, logger=True)
        
        return {"loss": loss, "accuracy": step_accuracy}
    
    def test_step(self, batch, batch_idx):
        sequences = batch["sequence"]
        labels = batch["label"]
        loss, outputs = self(sequences, labels)
        predictions = torch.argmax(outputs, dim=1)
        step_accuracy = accuracy(predictions, labels)
        
        self.log("test_loss", loss, prog_bar=True, logger=True)
        self.log("test_accuracy", step_accuracy, prog_bar=True, logger=True)
        
        return {"loss": loss, "accuracy": step_accuracy}
    
    def configure_optimizers(self):
        return optim.Adam(self.parameters(), lr=0.0001)

Global seed set to 42


## 參數設置

In [3]:
%load_ext tensorboard
%reload_ext tensorboard
%tensorboard --logdir ./lightning_logs --host 0.0.0.0 --port=8888

In [4]:
X_train = pd.read_csv('../data2.csv')

In [5]:
N_EPOCHS = 200
BATCH_SIZE = 50

# randomed 
ORG_FEATURE_COLUMNS = ['HEOR', 'T5', 'VEOL', 'VEOU', 'F8', 'FZ', 'F7', 'TP8', 'FC3', 'T4', 'HEOL', 'FT10', 'O2', 'FC4', 'FCZ', 'CP3', 'FP2', 'TP7', 'C3', 'F3', 'PZ', 'F4', 'O1', 'FT7', 'CP4', 'FP1', 'C4', 'T6', 'FT8', 'CZ', 'PO1', 'OZ', 'A2', 'A1', 'T3', 'P4', 'P3', 'FT9', 'CPZ', 'PO2']
# ['HEOR', 'T5', 'VEOL', 'VEOU', 'F8', 'FZ', 'F7', 'TP8', 'FC3', 'T4', 'HEOL', 'FT10', 'O2', 'FC4', 'FCZ', 'CP3', 'FP2', 'TP7', 'C3', 'F3', 'PZ', 'F4', 'O1', 'FT7', 'CP4', 'FP1', 'C4', 'T6', 'FT8', 'CZ', 'PO1', 'OZ', 'A2', 'A1', 'T3', 'P4', 'P3', 'FT9', 'CPZ', 'PO2']
g = X_train.groupby("group")

In [6]:
# import random
# ORG_FEATURE_COLUMNS = ['TP8', 'FP2', 'FCZ', 'FT10', 'O2', 'O1', 'FT7', 'F4', 'TP7', 'C3', 'C4', 'F3', 'FT8', 'T6', 'HEOR', 'T5', 'VEOL', 'F7', 'FZ', 'VEOU', 'A1', 'P3', 'PZ', 'CP3', 'P4', 'CPZ', 'A2', 'HEOL', 'CP4', 'FT9', 'F8', 'OZ', 'CZ', 'FC4', 'FC3', 'FP1', 'PO1', 'T3', 'T4', 'PO2']
# random.shuffle(ORG_FEATURE_COLUMNS)
# print(ORG_FEATURE_COLUMNS)

## Main

In [None]:
n = 35
FEATURE_COLUMNS = ORG_FEATURE_COLUMNS[n:]

while(n < 40):
    print("------------------ Round: " + str(n) + " ------------------")
    print(FEATURE_COLUMNS)
    print("Len:", len(FEATURE_COLUMNS))
    
    label_encoder = LabelEncoder()
    encoded_labels = label_encoder.fit_transform(X_train.state)

    label_encoder.classes_

    X_train['label'] = encoded_labels

    # Prepare data ###########################################
    sequences = [] 

    for name, group in g:
        sequence_features = group[FEATURE_COLUMNS]
        label = group.label.iloc[0]

        # print((sequence_features, label))
        sequences.append((sequence_features, label))

    # Setting up train, test, val gruop #######################
    train_sequences, test_sequences = train_test_split(sequences, test_size=0.2)
    val_sequences, test_sequences = train_test_split(test_sequences, test_size=0.5)


    # Setting up data module ##################################
    data_module = DrowsyDataModule(
        train_sequences, val_sequences, test_sequences, BATCH_SIZE
    )

    model = DrowsyPredictor(
        n_features=len(FEATURE_COLUMNS), 
        n_classes=len(label_encoder.classes_)
    )

    # Check points and logger #################################
    checkpoint_callback = ModelCheckpoint(
        dirpath="checkpoints",
        filename="best-checkpoint-corr-mi-" + str(n),
        save_top_k=2,
        verbose=True,
        monitor="val_loss",
        mode="min"
    )

    logger = TensorBoardLogger("lightning_logs", name="Drowsy_MI" + str(n))

    trainer = pl.Trainer(
        logger=logger,
        callbacks=[checkpoint_callback],
        max_epochs=N_EPOCHS,
        gpus=[2],
#         gpus=1, 
#         auto_select_gpus=True,
        auto_lr_find=True, 
        # check_val_every_n_epoch=10
        # refresh_rate=20,
    )
    
    # Training start
    if (n == 35):
        trainer.fit(model, data_module, ckpt_path="/Workspace/code/checkpoints/best-checkpoint-corr-mi-35-v1.ckpt")
    else:
        trainer.fit(model, data_module)
    trainer.test(model, data_module)
    
    FEATURE_COLUMNS.pop(0)
    n = n + 1

------------------ Round: 35 ------------------
['P4', 'P3', 'FT9', 'CPZ', 'PO2']
Len: 5


GPU available: True, used: True
TPU available: False, using: 0 TPU cores
IPU available: False, using: 0 IPUs
Restoring states from the checkpoint path at /Workspace/code/checkpoints/best-checkpoint-corr-mi-35-v1.ckpt
LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1,2]
  "You're resuming from a checkpoint that ended mid-epoch."
Restored all states from the checkpoint file at /Workspace/code/checkpoints/best-checkpoint-corr-mi-35-v1.ckpt

  | Name      | Type             | Params
-----------------------------------------------
0 | model     | DrowsyModel      | 1.3 M 
1 | criterion | CrossEntropyLoss | 0     
-----------------------------------------------
1.3 M     Trainable params
0         Non-trainable params
1.3 M     Total params
5.290     Total estimated model params size (MB)
  rank_zero_warn(f"Checkpoint directory {dirpath} exists and is not empty.")


                                                                      

Global seed set to 42


Epoch 7:  89%|████████▊ | 226/255 [02:38<00:20,  1.42it/s, loss=0.664, v_num=1, train_loss=0.657, train_accuracy=0.556]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 7:  89%|████████▉ | 228/255 [02:41<00:19,  1.41it/s, loss=0.664, v_num=1, train_loss=0.657, train_accuracy=0.556]
Validating:   7%|▋         | 2/29 [00:02<00:30,  1.15s/it][A
Epoch 7:  90%|█████████ | 230/255 [02:41<00:17,  1.42it/s, loss=0.664, v_num=1, train_loss=0.657, train_accuracy=0.556]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.98it/s][A
Epoch 7:  91%|█████████ | 232/255 [02:42<00:16,  1.43it/s, loss=0.664, v_num=1, train_loss=0.657, train_accuracy=0.556]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.13it/s][A
Epoch 7:  92%|█████████▏| 234/255 [02:42<00:14,  1.44it/s, loss=0.664, v_num=1, train_loss=0.657, train_accuracy=0.556]
Validating:  28%|██▊       | 8/29 [00:03<00:05,  4.00it/s][A
Epoch 7:  93%|█████████▎| 236/255 [02:43<00:13,  1.45it/s, loss=

Epoch 7, global step 1807: val_loss reached 0.66877 (best 0.66877), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35.ckpt" as top 2


Epoch 8:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.633, v_num=1, train_loss=0.633, train_accuracy=0.611, val_loss=0.669, val_accuracy=0.549]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 8:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.633, v_num=1, train_loss=0.633, train_accuracy=0.611, val_loss=0.669, val_accuracy=0.549]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.19s/it][A
Epoch 8:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.633, v_num=1, train_loss=0.633, train_accuracy=0.611, val_loss=0.669, val_accuracy=0.549]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.94it/s][A
Epoch 8:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.633, v_num=1, train_loss=0.633, train_accuracy=0.611, val_loss=0.669, val_accuracy=0.549]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.10it/s][A
Epoch 8:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.633, v_num=1, train_loss=0.633, trai

Epoch 8, global step 2033: val_loss was not in top 2


Epoch 9:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.648, v_num=1, train_loss=0.642, train_accuracy=0.556, val_loss=0.737, val_accuracy=0.594]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 9:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.648, v_num=1, train_loss=0.642, train_accuracy=0.556, val_loss=0.737, val_accuracy=0.594]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.17s/it][A
Epoch 9:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.648, v_num=1, train_loss=0.642, train_accuracy=0.556, val_loss=0.737, val_accuracy=0.594]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.98it/s][A
Epoch 9:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.648, v_num=1, train_loss=0.642, train_accuracy=0.556, val_loss=0.737, val_accuracy=0.594]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.11it/s][A
Epoch 9:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.648, v_num=1, train_loss=0.642, trai

Epoch 9, global step 2259: val_loss reached 0.65925 (best 0.65925), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35-v1.ckpt" as top 2


Epoch 10:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.617, v_num=1, train_loss=0.861, train_accuracy=0.556, val_loss=0.659, val_accuracy=0.585]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 10:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.617, v_num=1, train_loss=0.861, train_accuracy=0.556, val_loss=0.659, val_accuracy=0.585]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.15s/it][A
Epoch 10:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.617, v_num=1, train_loss=0.861, train_accuracy=0.556, val_loss=0.659, val_accuracy=0.585]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.97it/s][A
Epoch 10:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.617, v_num=1, train_loss=0.861, train_accuracy=0.556, val_loss=0.659, val_accuracy=0.585]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.09it/s][A
Epoch 10:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.617, v_num=1, train_loss=0.861,

Epoch 10, global step 2485: val_loss was not in top 2


Epoch 11:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.609, v_num=1, train_loss=0.450, train_accuracy=0.944, val_loss=0.823, val_accuracy=0.586]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 11:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.609, v_num=1, train_loss=0.450, train_accuracy=0.944, val_loss=0.823, val_accuracy=0.586]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.20s/it][A
Epoch 11:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.609, v_num=1, train_loss=0.450, train_accuracy=0.944, val_loss=0.823, val_accuracy=0.586]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.93it/s][A
Epoch 11:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.609, v_num=1, train_loss=0.450, train_accuracy=0.944, val_loss=0.823, val_accuracy=0.586]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.08it/s][A
Epoch 11:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.609, v_num=1, train_loss=0.450,

Epoch 11, global step 2711: val_loss reached 0.66496 (best 0.65925), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35.ckpt" as top 2


Epoch 12:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.64, v_num=1, train_loss=0.691, train_accuracy=0.500, val_loss=0.665, val_accuracy=0.594] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 12:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.64, v_num=1, train_loss=0.691, train_accuracy=0.500, val_loss=0.665, val_accuracy=0.594]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.16s/it][A
Epoch 12:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.64, v_num=1, train_loss=0.691, train_accuracy=0.500, val_loss=0.665, val_accuracy=0.594]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.96it/s][A
Epoch 12:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.64, v_num=1, train_loss=0.691, train_accuracy=0.500, val_loss=0.665, val_accuracy=0.594]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.12it/s][A
Epoch 12:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.64, v_num=1, train_loss=0.691, tra

Epoch 12, global step 2937: val_loss reached 0.65970 (best 0.65925), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35.ckpt" as top 2


Epoch 13:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.621, v_num=1, train_loss=0.587, train_accuracy=0.722, val_loss=0.660, val_accuracy=0.593]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 13:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.621, v_num=1, train_loss=0.587, train_accuracy=0.722, val_loss=0.660, val_accuracy=0.593]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.15s/it][A
Epoch 13:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.621, v_num=1, train_loss=0.587, train_accuracy=0.722, val_loss=0.660, val_accuracy=0.593]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.97it/s][A
Epoch 13:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.621, v_num=1, train_loss=0.587, train_accuracy=0.722, val_loss=0.660, val_accuracy=0.593]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.10it/s][A
Epoch 13:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.621, v_num=1, train_loss=0.587,

Epoch 13, global step 3163: val_loss reached 0.65738 (best 0.65738), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35.ckpt" as top 2


Epoch 14:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.61, v_num=1, train_loss=0.627, train_accuracy=0.722, val_loss=0.657, val_accuracy=0.590] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 14:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.61, v_num=1, train_loss=0.627, train_accuracy=0.722, val_loss=0.657, val_accuracy=0.590]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.21s/it][A
Epoch 14:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.61, v_num=1, train_loss=0.627, train_accuracy=0.722, val_loss=0.657, val_accuracy=0.590]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.92it/s][A
Epoch 14:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.61, v_num=1, train_loss=0.627, train_accuracy=0.722, val_loss=0.657, val_accuracy=0.590]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.03it/s][A
Epoch 14:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.61, v_num=1, train_loss=0.627, tra

Epoch 14, global step 3389: val_loss reached 0.63618 (best 0.63618), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35-v1.ckpt" as top 2


Epoch 15:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.659, v_num=1, train_loss=0.630, train_accuracy=0.667, val_loss=0.636, val_accuracy=0.609]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 15:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.659, v_num=1, train_loss=0.630, train_accuracy=0.667, val_loss=0.636, val_accuracy=0.609]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.17s/it][A
Epoch 15:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.659, v_num=1, train_loss=0.630, train_accuracy=0.667, val_loss=0.636, val_accuracy=0.609]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.97it/s][A
Epoch 15:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.659, v_num=1, train_loss=0.630, train_accuracy=0.667, val_loss=0.636, val_accuracy=0.609]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.14it/s][A
Epoch 15:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.659, v_num=1, train_loss=0.630,

Epoch 15, global step 3615: val_loss was not in top 2


Epoch 16:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.635, v_num=1, train_loss=0.577, train_accuracy=0.833, val_loss=0.719, val_accuracy=0.568]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 16:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.635, v_num=1, train_loss=0.577, train_accuracy=0.833, val_loss=0.719, val_accuracy=0.568]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.16s/it][A
Epoch 16:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.635, v_num=1, train_loss=0.577, train_accuracy=0.833, val_loss=0.719, val_accuracy=0.568]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.94it/s][A
Epoch 16:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.635, v_num=1, train_loss=0.577, train_accuracy=0.833, val_loss=0.719, val_accuracy=0.568]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.09it/s][A
Epoch 16:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.635, v_num=1, train_loss=0.577,

Epoch 16, global step 3841: val_loss was not in top 2


Epoch 17:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.61, v_num=1, train_loss=0.573, train_accuracy=0.778, val_loss=0.677, val_accuracy=0.630] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 17:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.61, v_num=1, train_loss=0.573, train_accuracy=0.778, val_loss=0.677, val_accuracy=0.630]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.20s/it][A
Epoch 17:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.61, v_num=1, train_loss=0.573, train_accuracy=0.778, val_loss=0.677, val_accuracy=0.630]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.90it/s][A
Epoch 17:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.61, v_num=1, train_loss=0.573, train_accuracy=0.778, val_loss=0.677, val_accuracy=0.630]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.04it/s][A
Epoch 17:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.61, v_num=1, train_loss=0.573, tra

Epoch 17, global step 4067: val_loss was not in top 2


Epoch 18:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.589, v_num=1, train_loss=0.557, train_accuracy=0.778, val_loss=0.669, val_accuracy=0.621]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 18:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.589, v_num=1, train_loss=0.557, train_accuracy=0.778, val_loss=0.669, val_accuracy=0.621]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 18:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.589, v_num=1, train_loss=0.557, train_accuracy=0.778, val_loss=0.669, val_accuracy=0.621]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.93it/s][A
Epoch 18:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.589, v_num=1, train_loss=0.557, train_accuracy=0.778, val_loss=0.669, val_accuracy=0.621]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.07it/s][A
Epoch 18:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.589, v_num=1, train_loss=0.557,

Epoch 18, global step 4293: val_loss reached 0.63618 (best 0.63618), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35.ckpt" as top 2


Epoch 19:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.685, v_num=1, train_loss=0.688, train_accuracy=0.611, val_loss=0.636, val_accuracy=0.659]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 19:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.685, v_num=1, train_loss=0.688, train_accuracy=0.611, val_loss=0.636, val_accuracy=0.659]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.16s/it][A
Epoch 19:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.685, v_num=1, train_loss=0.688, train_accuracy=0.611, val_loss=0.636, val_accuracy=0.659]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.99it/s][A
Epoch 19:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.685, v_num=1, train_loss=0.688, train_accuracy=0.611, val_loss=0.636, val_accuracy=0.659]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.07it/s][A
Epoch 19:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.685, v_num=1, train_loss=0.688,

Epoch 19, global step 4519: val_loss was not in top 2


Epoch 20:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.672, v_num=1, train_loss=0.696, train_accuracy=0.556, val_loss=0.696, val_accuracy=0.496]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 20:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.672, v_num=1, train_loss=0.696, train_accuracy=0.556, val_loss=0.696, val_accuracy=0.496]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.21s/it][A
Epoch 20:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.672, v_num=1, train_loss=0.696, train_accuracy=0.556, val_loss=0.696, val_accuracy=0.496]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.91it/s][A
Epoch 20:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.672, v_num=1, train_loss=0.696, train_accuracy=0.556, val_loss=0.696, val_accuracy=0.496]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.98it/s][A
Epoch 20:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.672, v_num=1, train_loss=0.696,

Epoch 20, global step 4745: val_loss was not in top 2


Epoch 21:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.656, v_num=1, train_loss=0.653, train_accuracy=0.500, val_loss=0.673, val_accuracy=0.569]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 21:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.656, v_num=1, train_loss=0.653, train_accuracy=0.500, val_loss=0.673, val_accuracy=0.569]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 21:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.656, v_num=1, train_loss=0.653, train_accuracy=0.500, val_loss=0.673, val_accuracy=0.569]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.93it/s][A
Epoch 21:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.656, v_num=1, train_loss=0.653, train_accuracy=0.500, val_loss=0.673, val_accuracy=0.569]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.07it/s][A
Epoch 21:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.656, v_num=1, train_loss=0.653,

Epoch 21, global step 4971: val_loss was not in top 2


Epoch 22:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.638, v_num=1, train_loss=0.686, train_accuracy=0.500, val_loss=0.660, val_accuracy=0.589]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 22:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.638, v_num=1, train_loss=0.686, train_accuracy=0.500, val_loss=0.660, val_accuracy=0.589]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.17s/it][A
Epoch 22:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.638, v_num=1, train_loss=0.686, train_accuracy=0.500, val_loss=0.660, val_accuracy=0.589]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.95it/s][A
Epoch 22:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.638, v_num=1, train_loss=0.686, train_accuracy=0.500, val_loss=0.660, val_accuracy=0.589]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.04it/s][A
Epoch 22:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.638, v_num=1, train_loss=0.686,

Epoch 22, global step 5197: val_loss was not in top 2


Epoch 23:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.618, v_num=1, train_loss=0.525, train_accuracy=0.722, val_loss=0.643, val_accuracy=0.609]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 23:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.618, v_num=1, train_loss=0.525, train_accuracy=0.722, val_loss=0.643, val_accuracy=0.609]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.17s/it][A
Epoch 23:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.618, v_num=1, train_loss=0.525, train_accuracy=0.722, val_loss=0.643, val_accuracy=0.609]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.95it/s][A
Epoch 23:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.618, v_num=1, train_loss=0.525, train_accuracy=0.722, val_loss=0.643, val_accuracy=0.609]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.06it/s][A
Epoch 23:  92%|█████████▏| 234/255 [02:41<00:14,  1.45it/s, loss=0.618, v_num=1, train_loss=0.525,

Epoch 23, global step 5423: val_loss was not in top 2


Epoch 24:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.602, v_num=1, train_loss=0.578, train_accuracy=0.667, val_loss=0.680, val_accuracy=0.595]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 24:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.602, v_num=1, train_loss=0.578, train_accuracy=0.667, val_loss=0.680, val_accuracy=0.595]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.21s/it][A
Epoch 24:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.602, v_num=1, train_loss=0.578, train_accuracy=0.667, val_loss=0.680, val_accuracy=0.595]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.93it/s][A
Epoch 24:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.602, v_num=1, train_loss=0.578, train_accuracy=0.667, val_loss=0.680, val_accuracy=0.595]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.10it/s][A
Epoch 24:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.602, v_num=1, train_loss=0.578,

Epoch 24, global step 5649: val_loss was not in top 2


Epoch 25:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.638, v_num=1, train_loss=0.630, train_accuracy=0.667, val_loss=0.743, val_accuracy=0.612]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 25:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.638, v_num=1, train_loss=0.630, train_accuracy=0.667, val_loss=0.743, val_accuracy=0.612]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.16s/it][A
Epoch 25:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.638, v_num=1, train_loss=0.630, train_accuracy=0.667, val_loss=0.743, val_accuracy=0.612]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.98it/s][A
Epoch 25:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.638, v_num=1, train_loss=0.630, train_accuracy=0.667, val_loss=0.743, val_accuracy=0.612]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.14it/s][A
Epoch 25:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.638, v_num=1, train_loss=0.630,

Epoch 25, global step 5875: val_loss reached 0.63356 (best 0.63356), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35.ckpt" as top 2


Epoch 26:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.616, v_num=1, train_loss=0.592, train_accuracy=0.667, val_loss=0.634, val_accuracy=0.625]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 26:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.616, v_num=1, train_loss=0.592, train_accuracy=0.667, val_loss=0.634, val_accuracy=0.625]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.17s/it][A
Epoch 26:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.616, v_num=1, train_loss=0.592, train_accuracy=0.667, val_loss=0.634, val_accuracy=0.625]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.95it/s][A
Epoch 26:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.616, v_num=1, train_loss=0.592, train_accuracy=0.667, val_loss=0.634, val_accuracy=0.625]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.05it/s][A
Epoch 26:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.616, v_num=1, train_loss=0.592,

Epoch 26, global step 6101: val_loss reached 0.62207 (best 0.62207), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35-v1.ckpt" as top 2


Epoch 27:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.671, v_num=1, train_loss=0.628, train_accuracy=0.500, val_loss=0.622, val_accuracy=0.636]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 27:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.671, v_num=1, train_loss=0.628, train_accuracy=0.500, val_loss=0.622, val_accuracy=0.636]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.16s/it][A
Epoch 27:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.671, v_num=1, train_loss=0.628, train_accuracy=0.500, val_loss=0.622, val_accuracy=0.636]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.96it/s][A
Epoch 27:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.671, v_num=1, train_loss=0.628, train_accuracy=0.500, val_loss=0.622, val_accuracy=0.636]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.06it/s][A
Epoch 27:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.671, v_num=1, train_loss=0.628,

Epoch 27, global step 6327: val_loss was not in top 2


Epoch 28:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.675, v_num=1, train_loss=0.626, train_accuracy=0.722, val_loss=0.740, val_accuracy=0.540]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 28:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.675, v_num=1, train_loss=0.626, train_accuracy=0.722, val_loss=0.740, val_accuracy=0.540]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 28:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.675, v_num=1, train_loss=0.626, train_accuracy=0.722, val_loss=0.740, val_accuracy=0.540]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.94it/s][A
Epoch 28:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.675, v_num=1, train_loss=0.626, train_accuracy=0.722, val_loss=0.740, val_accuracy=0.540]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.08it/s][A
Epoch 28:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.675, v_num=1, train_loss=0.626,

Epoch 28, global step 6553: val_loss was not in top 2


Epoch 29:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.592, v_num=1, train_loss=0.654, train_accuracy=0.778, val_loss=0.659, val_accuracy=0.576]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 29:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.592, v_num=1, train_loss=0.654, train_accuracy=0.778, val_loss=0.659, val_accuracy=0.576]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 29:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.592, v_num=1, train_loss=0.654, train_accuracy=0.778, val_loss=0.659, val_accuracy=0.576]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.94it/s][A
Epoch 29:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.592, v_num=1, train_loss=0.654, train_accuracy=0.778, val_loss=0.659, val_accuracy=0.576]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.05it/s][A
Epoch 29:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.592, v_num=1, train_loss=0.654,

Epoch 29, global step 6779: val_loss reached 0.62465 (best 0.62207), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35.ckpt" as top 2


Epoch 30:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.557, v_num=1, train_loss=0.406, train_accuracy=0.889, val_loss=0.625, val_accuracy=0.672]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 30:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.557, v_num=1, train_loss=0.406, train_accuracy=0.889, val_loss=0.625, val_accuracy=0.672]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 30:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.557, v_num=1, train_loss=0.406, train_accuracy=0.889, val_loss=0.625, val_accuracy=0.672]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.96it/s][A
Epoch 30:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.557, v_num=1, train_loss=0.406, train_accuracy=0.889, val_loss=0.625, val_accuracy=0.672]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.06it/s][A
Epoch 30:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.557, v_num=1, train_loss=0.406,

Epoch 30, global step 7005: val_loss was not in top 2


Epoch 31:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.602, v_num=1, train_loss=0.601, train_accuracy=0.611, val_loss=0.809, val_accuracy=0.656]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 31:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.602, v_num=1, train_loss=0.601, train_accuracy=0.611, val_loss=0.809, val_accuracy=0.656]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 31:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.602, v_num=1, train_loss=0.601, train_accuracy=0.611, val_loss=0.809, val_accuracy=0.656]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.94it/s][A
Epoch 31:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.602, v_num=1, train_loss=0.601, train_accuracy=0.611, val_loss=0.809, val_accuracy=0.656]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.07it/s][A
Epoch 31:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.602, v_num=1, train_loss=0.601,

Epoch 31, global step 7231: val_loss reached 0.62242 (best 0.62207), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35.ckpt" as top 2


Epoch 32:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.606, v_num=1, train_loss=0.612, train_accuracy=0.611, val_loss=0.622, val_accuracy=0.643]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 32:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.606, v_num=1, train_loss=0.612, train_accuracy=0.611, val_loss=0.622, val_accuracy=0.643]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.19s/it][A
Epoch 32:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.606, v_num=1, train_loss=0.612, train_accuracy=0.611, val_loss=0.622, val_accuracy=0.643]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.95it/s][A
Epoch 32:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.606, v_num=1, train_loss=0.612, train_accuracy=0.611, val_loss=0.622, val_accuracy=0.643]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.06it/s][A
Epoch 32:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.606, v_num=1, train_loss=0.612,

Epoch 32, global step 7457: val_loss reached 0.60184 (best 0.60184), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35.ckpt" as top 2


Epoch 33:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.579, v_num=1, train_loss=0.538, train_accuracy=0.778, val_loss=0.602, val_accuracy=0.668]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 33:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.579, v_num=1, train_loss=0.538, train_accuracy=0.778, val_loss=0.602, val_accuracy=0.668]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 33:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.579, v_num=1, train_loss=0.538, train_accuracy=0.778, val_loss=0.602, val_accuracy=0.668]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.96it/s][A
Epoch 33:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.579, v_num=1, train_loss=0.538, train_accuracy=0.778, val_loss=0.602, val_accuracy=0.668]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.14it/s][A
Epoch 33:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.579, v_num=1, train_loss=0.538,

Epoch 33, global step 7683: val_loss reached 0.59379 (best 0.59379), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35-v1.ckpt" as top 2


Epoch 34:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.693, v_num=1, train_loss=0.412, train_accuracy=0.833, val_loss=0.594, val_accuracy=0.652]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 34:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.693, v_num=1, train_loss=0.412, train_accuracy=0.833, val_loss=0.594, val_accuracy=0.652]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.17s/it][A
Epoch 34:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.693, v_num=1, train_loss=0.412, train_accuracy=0.833, val_loss=0.594, val_accuracy=0.652]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.98it/s][A
Epoch 34:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.693, v_num=1, train_loss=0.412, train_accuracy=0.833, val_loss=0.594, val_accuracy=0.652]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.15it/s][A
Epoch 34:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.693, v_num=1, train_loss=0.412,

Epoch 34, global step 7909: val_loss was not in top 2


Epoch 35:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.59, v_num=1, train_loss=0.506, train_accuracy=0.833, val_loss=0.725, val_accuracy=0.566] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 35:  89%|████████▉ | 228/255 [02:40<00:18,  1.42it/s, loss=0.59, v_num=1, train_loss=0.506, train_accuracy=0.833, val_loss=0.725, val_accuracy=0.566]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.27s/it][A
Epoch 35:  90%|█████████ | 230/255 [02:40<00:17,  1.43it/s, loss=0.59, v_num=1, train_loss=0.506, train_accuracy=0.833, val_loss=0.725, val_accuracy=0.566]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.84it/s][A
Epoch 35:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.59, v_num=1, train_loss=0.506, train_accuracy=0.833, val_loss=0.725, val_accuracy=0.566]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.96it/s][A
Epoch 35:  92%|█████████▏| 234/255 [02:41<00:14,  1.45it/s, loss=0.59, v_num=1, train_loss=0.506, tra

Epoch 35, global step 8135: val_loss reached 0.59851 (best 0.59379), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35.ckpt" as top 2


Epoch 36:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.59, v_num=1, train_loss=0.604, train_accuracy=0.722, val_loss=0.599, val_accuracy=0.672] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 36:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.59, v_num=1, train_loss=0.604, train_accuracy=0.722, val_loss=0.599, val_accuracy=0.672]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.17s/it][A
Epoch 36:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.59, v_num=1, train_loss=0.604, train_accuracy=0.722, val_loss=0.599, val_accuracy=0.672]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.97it/s][A
Epoch 36:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.59, v_num=1, train_loss=0.604, train_accuracy=0.722, val_loss=0.599, val_accuracy=0.672]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.14it/s][A
Epoch 36:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.59, v_num=1, train_loss=0.604, tra

Epoch 36, global step 8361: val_loss reached 0.59696 (best 0.59379), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35.ckpt" as top 2


Epoch 37:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.543, v_num=1, train_loss=0.571, train_accuracy=0.667, val_loss=0.597, val_accuracy=0.654]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 37:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.543, v_num=1, train_loss=0.571, train_accuracy=0.667, val_loss=0.597, val_accuracy=0.654]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 37:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.543, v_num=1, train_loss=0.571, train_accuracy=0.667, val_loss=0.597, val_accuracy=0.654]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.93it/s][A
Epoch 37:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.543, v_num=1, train_loss=0.571, train_accuracy=0.667, val_loss=0.597, val_accuracy=0.654]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.04it/s][A
Epoch 37:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.543, v_num=1, train_loss=0.571,

Epoch 37, global step 8587: val_loss reached 0.54718 (best 0.54718), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35.ckpt" as top 2


Epoch 38:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.519, v_num=1, train_loss=0.614, train_accuracy=0.667, val_loss=0.547, val_accuracy=0.707]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 38:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.519, v_num=1, train_loss=0.614, train_accuracy=0.667, val_loss=0.547, val_accuracy=0.707]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.17s/it][A
Epoch 38:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.519, v_num=1, train_loss=0.614, train_accuracy=0.667, val_loss=0.547, val_accuracy=0.707]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.98it/s][A
Epoch 38:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.519, v_num=1, train_loss=0.614, train_accuracy=0.667, val_loss=0.547, val_accuracy=0.707]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.13it/s][A
Epoch 38:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.519, v_num=1, train_loss=0.614,

Epoch 38, global step 8813: val_loss reached 0.55777 (best 0.54718), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35-v1.ckpt" as top 2


Epoch 39:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.531, v_num=1, train_loss=0.429, train_accuracy=0.889, val_loss=0.558, val_accuracy=0.714]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 39:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.531, v_num=1, train_loss=0.429, train_accuracy=0.889, val_loss=0.558, val_accuracy=0.714]
Validating:   7%|▋         | 2/29 [00:02<00:34,  1.26s/it][A
Epoch 39:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.531, v_num=1, train_loss=0.429, train_accuracy=0.889, val_loss=0.558, val_accuracy=0.714]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.85it/s][A
Epoch 39:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.531, v_num=1, train_loss=0.429, train_accuracy=0.889, val_loss=0.558, val_accuracy=0.714]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.95it/s][A
Epoch 39:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.531, v_num=1, train_loss=0.429,

Epoch 39, global step 9039: val_loss reached 0.52389 (best 0.52389), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35-v1.ckpt" as top 2


Epoch 40:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.556, v_num=1, train_loss=0.617, train_accuracy=0.611, val_loss=0.524, val_accuracy=0.759]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 40:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.556, v_num=1, train_loss=0.617, train_accuracy=0.611, val_loss=0.524, val_accuracy=0.759]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.21s/it][A
Epoch 40:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.556, v_num=1, train_loss=0.617, train_accuracy=0.611, val_loss=0.524, val_accuracy=0.759]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.89it/s][A
Epoch 40:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.556, v_num=1, train_loss=0.617, train_accuracy=0.611, val_loss=0.524, val_accuracy=0.759]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.03it/s][A
Epoch 40:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.556, v_num=1, train_loss=0.617,

Epoch 40, global step 9265: val_loss was not in top 2


Epoch 41:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.523, v_num=1, train_loss=0.412, train_accuracy=0.944, val_loss=0.565, val_accuracy=0.720]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 41:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.523, v_num=1, train_loss=0.412, train_accuracy=0.944, val_loss=0.565, val_accuracy=0.720]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 41:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.523, v_num=1, train_loss=0.412, train_accuracy=0.944, val_loss=0.565, val_accuracy=0.720]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.96it/s][A
Epoch 41:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.523, v_num=1, train_loss=0.412, train_accuracy=0.944, val_loss=0.565, val_accuracy=0.720]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.14it/s][A
Epoch 41:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.523, v_num=1, train_loss=0.412,

Epoch 41, global step 9491: val_loss was not in top 2


Epoch 42:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.526, v_num=1, train_loss=0.345, train_accuracy=1.000, val_loss=0.560, val_accuracy=0.715]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 42:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.526, v_num=1, train_loss=0.345, train_accuracy=1.000, val_loss=0.560, val_accuracy=0.715]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 42:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.526, v_num=1, train_loss=0.345, train_accuracy=1.000, val_loss=0.560, val_accuracy=0.715]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.94it/s][A
Epoch 42:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.526, v_num=1, train_loss=0.345, train_accuracy=1.000, val_loss=0.560, val_accuracy=0.715]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.05it/s][A
Epoch 42:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.526, v_num=1, train_loss=0.345,

Epoch 42, global step 9717: val_loss reached 0.52912 (best 0.52389), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35.ckpt" as top 2


Epoch 43:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.53, v_num=1, train_loss=0.475, train_accuracy=0.778, val_loss=0.529, val_accuracy=0.738] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 43:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.53, v_num=1, train_loss=0.475, train_accuracy=0.778, val_loss=0.529, val_accuracy=0.738]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 43:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.53, v_num=1, train_loss=0.475, train_accuracy=0.778, val_loss=0.529, val_accuracy=0.738]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.95it/s][A
Epoch 43:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.53, v_num=1, train_loss=0.475, train_accuracy=0.778, val_loss=0.529, val_accuracy=0.738]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.07it/s][A
Epoch 43:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.53, v_num=1, train_loss=0.475, tra

Epoch 43, global step 9943: val_loss was not in top 2


Epoch 44:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.481, v_num=1, train_loss=0.530, train_accuracy=0.722, val_loss=0.553, val_accuracy=0.684]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 44:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.481, v_num=1, train_loss=0.530, train_accuracy=0.722, val_loss=0.553, val_accuracy=0.684]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.17s/it][A
Epoch 44:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.481, v_num=1, train_loss=0.530, train_accuracy=0.722, val_loss=0.553, val_accuracy=0.684]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.95it/s][A
Epoch 44:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.481, v_num=1, train_loss=0.530, train_accuracy=0.722, val_loss=0.553, val_accuracy=0.684]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.10it/s][A
Epoch 44:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.481, v_num=1, train_loss=0.530,

Epoch 44, global step 10169: val_loss reached 0.52575 (best 0.52389), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35.ckpt" as top 2


Epoch 45:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.549, v_num=1, train_loss=0.770, train_accuracy=0.611, val_loss=0.526, val_accuracy=0.753]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 45:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.549, v_num=1, train_loss=0.770, train_accuracy=0.611, val_loss=0.526, val_accuracy=0.753]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.17s/it][A
Epoch 45:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.549, v_num=1, train_loss=0.770, train_accuracy=0.611, val_loss=0.526, val_accuracy=0.753]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.97it/s][A
Epoch 45:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.549, v_num=1, train_loss=0.770, train_accuracy=0.611, val_loss=0.526, val_accuracy=0.753]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.10it/s][A
Epoch 45:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.549, v_num=1, train_loss=0.770,

Epoch 45, global step 10395: val_loss was not in top 2


Epoch 46:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.481, v_num=1, train_loss=0.438, train_accuracy=0.778, val_loss=0.556, val_accuracy=0.707]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 46:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.481, v_num=1, train_loss=0.438, train_accuracy=0.778, val_loss=0.556, val_accuracy=0.707]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 46:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.481, v_num=1, train_loss=0.438, train_accuracy=0.778, val_loss=0.556, val_accuracy=0.707]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.95it/s][A
Epoch 46:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.481, v_num=1, train_loss=0.438, train_accuracy=0.778, val_loss=0.556, val_accuracy=0.707]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.10it/s][A
Epoch 46:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.481, v_num=1, train_loss=0.438,

Epoch 46, global step 10621: val_loss was not in top 2


Epoch 47:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.435, v_num=1, train_loss=0.477, train_accuracy=0.778, val_loss=0.535, val_accuracy=0.731]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 47:  89%|████████▉ | 228/255 [02:40<00:18,  1.42it/s, loss=0.435, v_num=1, train_loss=0.477, train_accuracy=0.778, val_loss=0.535, val_accuracy=0.731]
Validating:   7%|▋         | 2/29 [00:03<00:38,  1.41s/it][A
Epoch 47:  90%|█████████ | 230/255 [02:40<00:17,  1.43it/s, loss=0.435, v_num=1, train_loss=0.477, train_accuracy=0.778, val_loss=0.535, val_accuracy=0.731]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.70it/s][A
Epoch 47:  91%|█████████ | 232/255 [02:41<00:15,  1.44it/s, loss=0.435, v_num=1, train_loss=0.477, train_accuracy=0.778, val_loss=0.535, val_accuracy=0.731]
Validating:  21%|██        | 6/29 [00:04<00:08,  2.83it/s][A
Epoch 47:  92%|█████████▏| 234/255 [02:41<00:14,  1.45it/s, loss=0.435, v_num=1, train_loss=0.477,

Epoch 47, global step 10847: val_loss reached 0.48161 (best 0.48161), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35.ckpt" as top 2


Epoch 48:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.49, v_num=1, train_loss=0.537, train_accuracy=0.778, val_loss=0.482, val_accuracy=0.779] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 48:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.49, v_num=1, train_loss=0.537, train_accuracy=0.778, val_loss=0.482, val_accuracy=0.779]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 48:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.49, v_num=1, train_loss=0.537, train_accuracy=0.778, val_loss=0.482, val_accuracy=0.779]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.94it/s][A
Epoch 48:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.49, v_num=1, train_loss=0.537, train_accuracy=0.778, val_loss=0.482, val_accuracy=0.779]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.11it/s][A
Epoch 48:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.49, v_num=1, train_loss=0.537, tra

Epoch 48, global step 11073: val_loss was not in top 2


Epoch 49:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.516, v_num=1, train_loss=0.559, train_accuracy=0.778, val_loss=0.525, val_accuracy=0.763]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 49:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.516, v_num=1, train_loss=0.559, train_accuracy=0.778, val_loss=0.525, val_accuracy=0.763]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.16s/it][A
Epoch 49:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.516, v_num=1, train_loss=0.559, train_accuracy=0.778, val_loss=0.525, val_accuracy=0.763]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.97it/s][A
Epoch 49:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.516, v_num=1, train_loss=0.559, train_accuracy=0.778, val_loss=0.525, val_accuracy=0.763]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.08it/s][A
Epoch 49:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.516, v_num=1, train_loss=0.559,

Epoch 49, global step 11299: val_loss was not in top 2


Epoch 50:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.42, v_num=1, train_loss=0.315, train_accuracy=0.889, val_loss=0.546, val_accuracy=0.721] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 50:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.42, v_num=1, train_loss=0.315, train_accuracy=0.889, val_loss=0.546, val_accuracy=0.721]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.17s/it][A
Epoch 50:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.42, v_num=1, train_loss=0.315, train_accuracy=0.889, val_loss=0.546, val_accuracy=0.721]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.92it/s][A
Epoch 50:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.42, v_num=1, train_loss=0.315, train_accuracy=0.889, val_loss=0.546, val_accuracy=0.721]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.04it/s][A
Epoch 50:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.42, v_num=1, train_loss=0.315, tra

Epoch 50, global step 11525: val_loss was not in top 2


Epoch 51:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.479, v_num=1, train_loss=0.351, train_accuracy=0.944, val_loss=0.536, val_accuracy=0.745]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 51:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.479, v_num=1, train_loss=0.351, train_accuracy=0.944, val_loss=0.536, val_accuracy=0.745]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.17s/it][A
Epoch 51:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.479, v_num=1, train_loss=0.351, train_accuracy=0.944, val_loss=0.536, val_accuracy=0.745]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.98it/s][A
Epoch 51:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.479, v_num=1, train_loss=0.351, train_accuracy=0.944, val_loss=0.536, val_accuracy=0.745]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.15it/s][A
Epoch 51:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.479, v_num=1, train_loss=0.351,

Epoch 51, global step 11751: val_loss reached 0.50977 (best 0.48161), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35-v1.ckpt" as top 2


Epoch 52:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.48, v_num=1, train_loss=0.459, train_accuracy=0.833, val_loss=0.510, val_accuracy=0.751] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 52:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.48, v_num=1, train_loss=0.459, train_accuracy=0.833, val_loss=0.510, val_accuracy=0.751]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.22s/it][A
Epoch 52:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.48, v_num=1, train_loss=0.459, train_accuracy=0.833, val_loss=0.510, val_accuracy=0.751]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.91it/s][A
Epoch 52:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.48, v_num=1, train_loss=0.459, train_accuracy=0.833, val_loss=0.510, val_accuracy=0.751]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.05it/s][A
Epoch 52:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.48, v_num=1, train_loss=0.459, tra

Epoch 52, global step 11977: val_loss reached 0.49143 (best 0.48161), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35-v1.ckpt" as top 2


Epoch 53:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.422, v_num=1, train_loss=0.391, train_accuracy=0.833, val_loss=0.491, val_accuracy=0.764]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 53:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.422, v_num=1, train_loss=0.391, train_accuracy=0.833, val_loss=0.491, val_accuracy=0.764]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.21s/it][A
Epoch 53:  90%|█████████ | 230/255 [02:40<00:17,  1.43it/s, loss=0.422, v_num=1, train_loss=0.391, train_accuracy=0.833, val_loss=0.491, val_accuracy=0.764]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.92it/s][A
Epoch 53:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.422, v_num=1, train_loss=0.391, train_accuracy=0.833, val_loss=0.491, val_accuracy=0.764]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.08it/s][A
Epoch 53:  92%|█████████▏| 234/255 [02:41<00:14,  1.45it/s, loss=0.422, v_num=1, train_loss=0.391,

Epoch 53, global step 12203: val_loss reached 0.44212 (best 0.44212), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35-v1.ckpt" as top 2


Epoch 54:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.466, v_num=1, train_loss=0.374, train_accuracy=0.889, val_loss=0.442, val_accuracy=0.811]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 54:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.466, v_num=1, train_loss=0.374, train_accuracy=0.889, val_loss=0.442, val_accuracy=0.811]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 54:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.466, v_num=1, train_loss=0.374, train_accuracy=0.889, val_loss=0.442, val_accuracy=0.811]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.94it/s][A
Epoch 54:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.466, v_num=1, train_loss=0.374, train_accuracy=0.889, val_loss=0.442, val_accuracy=0.811]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.07it/s][A
Epoch 54:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.466, v_num=1, train_loss=0.374,

Epoch 54, global step 12429: val_loss reached 0.48020 (best 0.44212), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35.ckpt" as top 2


Epoch 55:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.556, v_num=1, train_loss=0.697, train_accuracy=0.500, val_loss=0.480, val_accuracy=0.781]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 55:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.556, v_num=1, train_loss=0.697, train_accuracy=0.500, val_loss=0.480, val_accuracy=0.781]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.21s/it][A
Epoch 55:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.556, v_num=1, train_loss=0.697, train_accuracy=0.500, val_loss=0.480, val_accuracy=0.781]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.92it/s][A
Epoch 55:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.556, v_num=1, train_loss=0.697, train_accuracy=0.500, val_loss=0.480, val_accuracy=0.781]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.08it/s][A
Epoch 55:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.556, v_num=1, train_loss=0.697,

Epoch 55, global step 12655: val_loss was not in top 2


Epoch 56:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.432, v_num=1, train_loss=0.455, train_accuracy=0.722, val_loss=0.590, val_accuracy=0.703]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 56:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.432, v_num=1, train_loss=0.455, train_accuracy=0.722, val_loss=0.590, val_accuracy=0.703]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.19s/it][A
Epoch 56:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.432, v_num=1, train_loss=0.455, train_accuracy=0.722, val_loss=0.590, val_accuracy=0.703]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.95it/s][A
Epoch 56:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.432, v_num=1, train_loss=0.455, train_accuracy=0.722, val_loss=0.590, val_accuracy=0.703]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.08it/s][A
Epoch 56:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.432, v_num=1, train_loss=0.455,

Epoch 56, global step 12881: val_loss reached 0.46066 (best 0.44212), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35.ckpt" as top 2


Epoch 57:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.452, v_num=1, train_loss=0.345, train_accuracy=0.778, val_loss=0.461, val_accuracy=0.784]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 57:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.452, v_num=1, train_loss=0.345, train_accuracy=0.778, val_loss=0.461, val_accuracy=0.784]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.19s/it][A
Epoch 57:  90%|█████████ | 230/255 [02:40<00:17,  1.43it/s, loss=0.452, v_num=1, train_loss=0.345, train_accuracy=0.778, val_loss=0.461, val_accuracy=0.784]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.93it/s][A
Epoch 57:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.452, v_num=1, train_loss=0.345, train_accuracy=0.778, val_loss=0.461, val_accuracy=0.784]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.06it/s][A
Epoch 57:  92%|█████████▏| 234/255 [02:41<00:14,  1.45it/s, loss=0.452, v_num=1, train_loss=0.345,

Epoch 57, global step 13107: val_loss was not in top 2


Epoch 58:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.485, v_num=1, train_loss=0.623, train_accuracy=0.556, val_loss=0.492, val_accuracy=0.764]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 58:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.485, v_num=1, train_loss=0.623, train_accuracy=0.556, val_loss=0.492, val_accuracy=0.764]
Validating:   7%|▋         | 2/29 [00:02<00:33,  1.25s/it][A
Epoch 58:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.485, v_num=1, train_loss=0.623, train_accuracy=0.556, val_loss=0.492, val_accuracy=0.764]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.87it/s][A
Epoch 58:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.485, v_num=1, train_loss=0.623, train_accuracy=0.556, val_loss=0.492, val_accuracy=0.764]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.03it/s][A
Epoch 58:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.485, v_num=1, train_loss=0.623,

Epoch 58, global step 13333: val_loss was not in top 2


Epoch 59:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.415, v_num=1, train_loss=0.254, train_accuracy=0.944, val_loss=0.567, val_accuracy=0.682]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 59:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.415, v_num=1, train_loss=0.254, train_accuracy=0.944, val_loss=0.567, val_accuracy=0.682]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.20s/it][A
Epoch 59:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.415, v_num=1, train_loss=0.254, train_accuracy=0.944, val_loss=0.567, val_accuracy=0.682]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.93it/s][A
Epoch 59:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.415, v_num=1, train_loss=0.254, train_accuracy=0.944, val_loss=0.567, val_accuracy=0.682]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.09it/s][A
Epoch 59:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.415, v_num=1, train_loss=0.254,

Epoch 59, global step 13559: val_loss was not in top 2


Epoch 60:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.535, v_num=1, train_loss=0.898, train_accuracy=0.556, val_loss=0.463, val_accuracy=0.783]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 60:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.535, v_num=1, train_loss=0.898, train_accuracy=0.556, val_loss=0.463, val_accuracy=0.783]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.17s/it][A
Epoch 60:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.535, v_num=1, train_loss=0.898, train_accuracy=0.556, val_loss=0.463, val_accuracy=0.783]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.97it/s][A
Epoch 60:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.535, v_num=1, train_loss=0.898, train_accuracy=0.556, val_loss=0.463, val_accuracy=0.783]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.08it/s][A
Epoch 60:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.535, v_num=1, train_loss=0.898,

Epoch 60, global step 13785: val_loss was not in top 2


Epoch 61:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.42, v_num=1, train_loss=0.569, train_accuracy=0.778, val_loss=0.514, val_accuracy=0.744] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 61:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.42, v_num=1, train_loss=0.569, train_accuracy=0.778, val_loss=0.514, val_accuracy=0.744]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 61:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.42, v_num=1, train_loss=0.569, train_accuracy=0.778, val_loss=0.514, val_accuracy=0.744]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.96it/s][A
Epoch 61:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.42, v_num=1, train_loss=0.569, train_accuracy=0.778, val_loss=0.514, val_accuracy=0.744]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.12it/s][A
Epoch 61:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.42, v_num=1, train_loss=0.569, tra

Epoch 61, global step 14011: val_loss was not in top 2


Epoch 62:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.462, v_num=1, train_loss=0.466, train_accuracy=0.722, val_loss=0.472, val_accuracy=0.770]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 62:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.462, v_num=1, train_loss=0.466, train_accuracy=0.722, val_loss=0.472, val_accuracy=0.770]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.17s/it][A
Epoch 62:  90%|█████████ | 230/255 [02:40<00:17,  1.43it/s, loss=0.462, v_num=1, train_loss=0.466, train_accuracy=0.722, val_loss=0.472, val_accuracy=0.770]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.96it/s][A
Epoch 62:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.462, v_num=1, train_loss=0.466, train_accuracy=0.722, val_loss=0.472, val_accuracy=0.770]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.04it/s][A
Epoch 62:  92%|█████████▏| 234/255 [02:41<00:14,  1.45it/s, loss=0.462, v_num=1, train_loss=0.466,

Epoch 62, global step 14237: val_loss was not in top 2


Epoch 63:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.418, v_num=1, train_loss=0.269, train_accuracy=1.000, val_loss=0.483, val_accuracy=0.772]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 63:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.418, v_num=1, train_loss=0.269, train_accuracy=1.000, val_loss=0.483, val_accuracy=0.772]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.27s/it][A
Epoch 63:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.418, v_num=1, train_loss=0.269, train_accuracy=1.000, val_loss=0.483, val_accuracy=0.772]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.83it/s][A
Epoch 63:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.418, v_num=1, train_loss=0.269, train_accuracy=1.000, val_loss=0.483, val_accuracy=0.772]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.96it/s][A
Epoch 63:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.418, v_num=1, train_loss=0.269,

Epoch 63, global step 14463: val_loss was not in top 2


Epoch 64:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.466, v_num=1, train_loss=0.607, train_accuracy=0.667, val_loss=0.472, val_accuracy=0.781]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 64:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.466, v_num=1, train_loss=0.607, train_accuracy=0.667, val_loss=0.472, val_accuracy=0.781]
Validating:   7%|▋         | 2/29 [00:02<00:33,  1.25s/it][A
Epoch 64:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.466, v_num=1, train_loss=0.607, train_accuracy=0.667, val_loss=0.472, val_accuracy=0.781]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.85it/s][A
Epoch 64:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.466, v_num=1, train_loss=0.607, train_accuracy=0.667, val_loss=0.472, val_accuracy=0.781]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.00it/s][A
Epoch 64:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.466, v_num=1, train_loss=0.607,

Epoch 64, global step 14689: val_loss was not in top 2


Epoch 65:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.555, v_num=1, train_loss=0.607, train_accuracy=0.722, val_loss=0.505, val_accuracy=0.745]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 65:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.555, v_num=1, train_loss=0.607, train_accuracy=0.722, val_loss=0.505, val_accuracy=0.745]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.32s/it][A
Epoch 65:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.555, v_num=1, train_loss=0.607, train_accuracy=0.722, val_loss=0.505, val_accuracy=0.745]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.80it/s][A
Epoch 65:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.555, v_num=1, train_loss=0.607, train_accuracy=0.722, val_loss=0.505, val_accuracy=0.745]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.90it/s][A
Epoch 65:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.555, v_num=1, train_loss=0.607,

Epoch 65, global step 14915: val_loss was not in top 2


Epoch 66:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.562, v_num=1, train_loss=0.512, train_accuracy=0.722, val_loss=0.575, val_accuracy=0.716]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 66:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.562, v_num=1, train_loss=0.512, train_accuracy=0.722, val_loss=0.575, val_accuracy=0.716]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 66:  90%|█████████ | 230/255 [02:40<00:17,  1.43it/s, loss=0.562, v_num=1, train_loss=0.512, train_accuracy=0.722, val_loss=0.575, val_accuracy=0.716]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.95it/s][A
Epoch 66:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.562, v_num=1, train_loss=0.512, train_accuracy=0.722, val_loss=0.575, val_accuracy=0.716]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.08it/s][A
Epoch 66:  92%|█████████▏| 234/255 [02:41<00:14,  1.45it/s, loss=0.562, v_num=1, train_loss=0.512,

Epoch 66, global step 15141: val_loss was not in top 2


Epoch 67:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.512, v_num=1, train_loss=0.414, train_accuracy=0.833, val_loss=0.560, val_accuracy=0.735]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 67:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.512, v_num=1, train_loss=0.414, train_accuracy=0.833, val_loss=0.560, val_accuracy=0.735]
Validating:   7%|▋         | 2/29 [00:02<00:33,  1.24s/it][A
Epoch 67:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.512, v_num=1, train_loss=0.414, train_accuracy=0.833, val_loss=0.560, val_accuracy=0.735]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.88it/s][A
Epoch 67:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.512, v_num=1, train_loss=0.414, train_accuracy=0.833, val_loss=0.560, val_accuracy=0.735]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.05it/s][A
Epoch 67:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.512, v_num=1, train_loss=0.414,

Epoch 67, global step 15367: val_loss was not in top 2


Epoch 68:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.517, v_num=1, train_loss=0.632, train_accuracy=0.722, val_loss=0.522, val_accuracy=0.758]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 68:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.517, v_num=1, train_loss=0.632, train_accuracy=0.722, val_loss=0.522, val_accuracy=0.758]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 68:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.517, v_num=1, train_loss=0.632, train_accuracy=0.722, val_loss=0.522, val_accuracy=0.758]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.96it/s][A
Epoch 68:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.517, v_num=1, train_loss=0.632, train_accuracy=0.722, val_loss=0.522, val_accuracy=0.758]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.10it/s][A
Epoch 68:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.517, v_num=1, train_loss=0.632,

Epoch 68, global step 15593: val_loss was not in top 2


Epoch 69:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.472, v_num=1, train_loss=0.428, train_accuracy=0.722, val_loss=0.503, val_accuracy=0.757]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 69:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.472, v_num=1, train_loss=0.428, train_accuracy=0.722, val_loss=0.503, val_accuracy=0.757]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.19s/it][A
Epoch 69:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.472, v_num=1, train_loss=0.428, train_accuracy=0.722, val_loss=0.503, val_accuracy=0.757]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.93it/s][A
Epoch 69:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.472, v_num=1, train_loss=0.428, train_accuracy=0.722, val_loss=0.503, val_accuracy=0.757]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.00it/s][A
Epoch 69:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.472, v_num=1, train_loss=0.428,

Epoch 69, global step 15819: val_loss was not in top 2


Epoch 70:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.465, v_num=1, train_loss=0.306, train_accuracy=0.833, val_loss=0.508, val_accuracy=0.754]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 70:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.465, v_num=1, train_loss=0.306, train_accuracy=0.833, val_loss=0.508, val_accuracy=0.754]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.17s/it][A
Epoch 70:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.465, v_num=1, train_loss=0.306, train_accuracy=0.833, val_loss=0.508, val_accuracy=0.754]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.95it/s][A
Epoch 70:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.465, v_num=1, train_loss=0.306, train_accuracy=0.833, val_loss=0.508, val_accuracy=0.754]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.11it/s][A
Epoch 70:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.465, v_num=1, train_loss=0.306,

Epoch 70, global step 16045: val_loss was not in top 2


Epoch 71:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.485, v_num=1, train_loss=0.542, train_accuracy=0.778, val_loss=0.513, val_accuracy=0.754]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 71:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.485, v_num=1, train_loss=0.542, train_accuracy=0.778, val_loss=0.513, val_accuracy=0.754]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.22s/it][A
Epoch 71:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.485, v_num=1, train_loss=0.542, train_accuracy=0.778, val_loss=0.513, val_accuracy=0.754]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.92it/s][A
Epoch 71:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.485, v_num=1, train_loss=0.542, train_accuracy=0.778, val_loss=0.513, val_accuracy=0.754]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.02it/s][A
Epoch 71:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.485, v_num=1, train_loss=0.542,

Epoch 71, global step 16271: val_loss was not in top 2


Epoch 72:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.446, v_num=1, train_loss=0.438, train_accuracy=0.778, val_loss=0.544, val_accuracy=0.761]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 72:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.446, v_num=1, train_loss=0.438, train_accuracy=0.778, val_loss=0.544, val_accuracy=0.761]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.19s/it][A
Epoch 72:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.446, v_num=1, train_loss=0.438, train_accuracy=0.778, val_loss=0.544, val_accuracy=0.761]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.91it/s][A
Epoch 72:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.446, v_num=1, train_loss=0.438, train_accuracy=0.778, val_loss=0.544, val_accuracy=0.761]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.07it/s][A
Epoch 72:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.446, v_num=1, train_loss=0.438,

Epoch 72, global step 16497: val_loss reached 0.45474 (best 0.44212), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35.ckpt" as top 2


Epoch 73:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.494, v_num=1, train_loss=0.523, train_accuracy=0.667, val_loss=0.455, val_accuracy=0.784]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 73:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.494, v_num=1, train_loss=0.523, train_accuracy=0.667, val_loss=0.455, val_accuracy=0.784]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.17s/it][A
Epoch 73:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.494, v_num=1, train_loss=0.523, train_accuracy=0.667, val_loss=0.455, val_accuracy=0.784]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.97it/s][A
Epoch 73:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.494, v_num=1, train_loss=0.523, train_accuracy=0.667, val_loss=0.455, val_accuracy=0.784]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.11it/s][A
Epoch 73:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.494, v_num=1, train_loss=0.523,

Epoch 73, global step 16723: val_loss was not in top 2


Epoch 74:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.365, v_num=1, train_loss=0.297, train_accuracy=0.833, val_loss=0.546, val_accuracy=0.729]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 74:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.365, v_num=1, train_loss=0.297, train_accuracy=0.833, val_loss=0.546, val_accuracy=0.729]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 74:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.365, v_num=1, train_loss=0.297, train_accuracy=0.833, val_loss=0.546, val_accuracy=0.729]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.96it/s][A
Epoch 74:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.365, v_num=1, train_loss=0.297, train_accuracy=0.833, val_loss=0.546, val_accuracy=0.729]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.14it/s][A
Epoch 74:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.365, v_num=1, train_loss=0.297,

Epoch 74, global step 16949: val_loss reached 0.42076 (best 0.42076), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35.ckpt" as top 2


Epoch 75:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.511, v_num=1, train_loss=0.684, train_accuracy=0.611, val_loss=0.421, val_accuracy=0.810]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 75:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.511, v_num=1, train_loss=0.684, train_accuracy=0.611, val_loss=0.421, val_accuracy=0.810]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 75:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.511, v_num=1, train_loss=0.684, train_accuracy=0.611, val_loss=0.421, val_accuracy=0.810]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.96it/s][A
Epoch 75:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.511, v_num=1, train_loss=0.684, train_accuracy=0.611, val_loss=0.421, val_accuracy=0.810]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.05it/s][A
Epoch 75:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.511, v_num=1, train_loss=0.684,

Epoch 75, global step 17175: val_loss was not in top 2


Epoch 76:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.634, v_num=1, train_loss=0.498, train_accuracy=0.722, val_loss=0.520, val_accuracy=0.722]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 76:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.634, v_num=1, train_loss=0.498, train_accuracy=0.722, val_loss=0.520, val_accuracy=0.722]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 76:  90%|█████████ | 230/255 [02:40<00:17,  1.43it/s, loss=0.634, v_num=1, train_loss=0.498, train_accuracy=0.722, val_loss=0.520, val_accuracy=0.722]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.91it/s][A
Epoch 76:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.634, v_num=1, train_loss=0.498, train_accuracy=0.722, val_loss=0.520, val_accuracy=0.722]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.08it/s][A
Epoch 76:  92%|█████████▏| 234/255 [02:41<00:14,  1.45it/s, loss=0.634, v_num=1, train_loss=0.498,

Epoch 76, global step 17401: val_loss was not in top 2


Epoch 77:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.432, v_num=1, train_loss=0.334, train_accuracy=0.833, val_loss=0.598, val_accuracy=0.654]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 77:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.432, v_num=1, train_loss=0.334, train_accuracy=0.833, val_loss=0.598, val_accuracy=0.654]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 77:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.432, v_num=1, train_loss=0.334, train_accuracy=0.833, val_loss=0.598, val_accuracy=0.654]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.92it/s][A
Epoch 77:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.432, v_num=1, train_loss=0.334, train_accuracy=0.833, val_loss=0.598, val_accuracy=0.654]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.06it/s][A
Epoch 77:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.432, v_num=1, train_loss=0.334,

Epoch 77, global step 17627: val_loss reached 0.43986 (best 0.42076), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35-v1.ckpt" as top 2


Epoch 78:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.403, v_num=1, train_loss=0.330, train_accuracy=0.944, val_loss=0.440, val_accuracy=0.798]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 78:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.403, v_num=1, train_loss=0.330, train_accuracy=0.944, val_loss=0.440, val_accuracy=0.798]
Validating:   7%|▋         | 2/29 [00:02<00:33,  1.25s/it][A
Epoch 78:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.403, v_num=1, train_loss=0.330, train_accuracy=0.944, val_loss=0.440, val_accuracy=0.798]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.83it/s][A
Epoch 78:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.403, v_num=1, train_loss=0.330, train_accuracy=0.944, val_loss=0.440, val_accuracy=0.798]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.99it/s][A
Epoch 78:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.403, v_num=1, train_loss=0.330,

Epoch 78, global step 17853: val_loss was not in top 2


Epoch 79:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.505, v_num=1, train_loss=0.378, train_accuracy=0.833, val_loss=0.447, val_accuracy=0.777]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 79:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.505, v_num=1, train_loss=0.378, train_accuracy=0.833, val_loss=0.447, val_accuracy=0.777]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 79:  90%|█████████ | 230/255 [02:40<00:17,  1.43it/s, loss=0.505, v_num=1, train_loss=0.378, train_accuracy=0.833, val_loss=0.447, val_accuracy=0.777]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.96it/s][A
Epoch 79:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.505, v_num=1, train_loss=0.378, train_accuracy=0.833, val_loss=0.447, val_accuracy=0.777]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.10it/s][A
Epoch 79:  92%|█████████▏| 234/255 [02:41<00:14,  1.45it/s, loss=0.505, v_num=1, train_loss=0.378,

Epoch 79, global step 18079: val_loss was not in top 2


Epoch 80:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.473, v_num=1, train_loss=0.691, train_accuracy=0.611, val_loss=0.575, val_accuracy=0.711]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 80:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.473, v_num=1, train_loss=0.691, train_accuracy=0.611, val_loss=0.575, val_accuracy=0.711]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 80:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.473, v_num=1, train_loss=0.691, train_accuracy=0.611, val_loss=0.575, val_accuracy=0.711]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.93it/s][A
Epoch 80:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.473, v_num=1, train_loss=0.691, train_accuracy=0.611, val_loss=0.575, val_accuracy=0.711]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.07it/s][A
Epoch 80:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.473, v_num=1, train_loss=0.691,

Epoch 80, global step 18305: val_loss was not in top 2


Epoch 81:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.407, v_num=1, train_loss=0.276, train_accuracy=0.889, val_loss=0.497, val_accuracy=0.762]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 81:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.407, v_num=1, train_loss=0.276, train_accuracy=0.889, val_loss=0.497, val_accuracy=0.762]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.17s/it][A
Epoch 81:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.407, v_num=1, train_loss=0.276, train_accuracy=0.889, val_loss=0.497, val_accuracy=0.762]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.97it/s][A
Epoch 81:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.407, v_num=1, train_loss=0.276, train_accuracy=0.889, val_loss=0.497, val_accuracy=0.762]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.07it/s][A
Epoch 81:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.407, v_num=1, train_loss=0.276,

Epoch 81, global step 18531: val_loss was not in top 2


Epoch 82:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.443, v_num=1, train_loss=0.500, train_accuracy=0.833, val_loss=0.450, val_accuracy=0.792]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 82:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.443, v_num=1, train_loss=0.500, train_accuracy=0.833, val_loss=0.450, val_accuracy=0.792]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.20s/it][A
Epoch 82:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.443, v_num=1, train_loss=0.500, train_accuracy=0.833, val_loss=0.450, val_accuracy=0.792]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.92it/s][A
Epoch 82:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.443, v_num=1, train_loss=0.500, train_accuracy=0.833, val_loss=0.450, val_accuracy=0.792]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.02it/s][A
Epoch 82:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.443, v_num=1, train_loss=0.500,

Epoch 82, global step 18757: val_loss was not in top 2


Epoch 83:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.404, v_num=1, train_loss=0.300, train_accuracy=0.778, val_loss=0.480, val_accuracy=0.759]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 83:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.404, v_num=1, train_loss=0.300, train_accuracy=0.778, val_loss=0.480, val_accuracy=0.759]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 83:  90%|█████████ | 230/255 [02:40<00:17,  1.43it/s, loss=0.404, v_num=1, train_loss=0.300, train_accuracy=0.778, val_loss=0.480, val_accuracy=0.759]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.95it/s][A
Epoch 83:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.404, v_num=1, train_loss=0.300, train_accuracy=0.778, val_loss=0.480, val_accuracy=0.759]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.12it/s][A
Epoch 83:  92%|█████████▏| 234/255 [02:41<00:14,  1.45it/s, loss=0.404, v_num=1, train_loss=0.300,

Epoch 83, global step 18983: val_loss reached 0.43521 (best 0.42076), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35-v1.ckpt" as top 2


Epoch 84:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.399, v_num=1, train_loss=0.435, train_accuracy=0.833, val_loss=0.435, val_accuracy=0.785]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 84:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.399, v_num=1, train_loss=0.435, train_accuracy=0.833, val_loss=0.435, val_accuracy=0.785]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 84:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.399, v_num=1, train_loss=0.435, train_accuracy=0.833, val_loss=0.435, val_accuracy=0.785]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.94it/s][A
Epoch 84:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.399, v_num=1, train_loss=0.435, train_accuracy=0.833, val_loss=0.435, val_accuracy=0.785]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.04it/s][A
Epoch 84:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.399, v_num=1, train_loss=0.435,

Epoch 84, global step 19209: val_loss was not in top 2


Epoch 85:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.458, v_num=1, train_loss=0.434, train_accuracy=0.833, val_loss=0.468, val_accuracy=0.784]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 85:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.458, v_num=1, train_loss=0.434, train_accuracy=0.833, val_loss=0.468, val_accuracy=0.784]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 85:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.458, v_num=1, train_loss=0.434, train_accuracy=0.833, val_loss=0.468, val_accuracy=0.784]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.95it/s][A
Epoch 85:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.458, v_num=1, train_loss=0.434, train_accuracy=0.833, val_loss=0.468, val_accuracy=0.784]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.07it/s][A
Epoch 85:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.458, v_num=1, train_loss=0.434,

Epoch 85, global step 19435: val_loss was not in top 2


Epoch 86:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.406, v_num=1, train_loss=0.454, train_accuracy=0.778, val_loss=0.457, val_accuracy=0.769]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 86:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.406, v_num=1, train_loss=0.454, train_accuracy=0.778, val_loss=0.457, val_accuracy=0.769]
Validating:   7%|▋         | 2/29 [00:02<00:33,  1.24s/it][A
Epoch 86:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.406, v_num=1, train_loss=0.454, train_accuracy=0.778, val_loss=0.457, val_accuracy=0.769]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.89it/s][A
Epoch 86:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.406, v_num=1, train_loss=0.454, train_accuracy=0.778, val_loss=0.457, val_accuracy=0.769]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.05it/s][A
Epoch 86:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.406, v_num=1, train_loss=0.454,

Epoch 86, global step 19661: val_loss reached 0.41597 (best 0.41597), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35-v1.ckpt" as top 2


Epoch 87:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.468, v_num=1, train_loss=0.494, train_accuracy=0.778, val_loss=0.416, val_accuracy=0.794]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 87:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.468, v_num=1, train_loss=0.494, train_accuracy=0.778, val_loss=0.416, val_accuracy=0.794]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 87:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.468, v_num=1, train_loss=0.494, train_accuracy=0.778, val_loss=0.416, val_accuracy=0.794]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.95it/s][A
Epoch 87:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.468, v_num=1, train_loss=0.494, train_accuracy=0.778, val_loss=0.416, val_accuracy=0.794]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.01it/s][A
Epoch 87:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.468, v_num=1, train_loss=0.494,

Epoch 87, global step 19887: val_loss was not in top 2


Epoch 88:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.412, v_num=1, train_loss=0.509, train_accuracy=0.833, val_loss=0.425, val_accuracy=0.797]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 88:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.412, v_num=1, train_loss=0.509, train_accuracy=0.833, val_loss=0.425, val_accuracy=0.797]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.19s/it][A
Epoch 88:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.412, v_num=1, train_loss=0.509, train_accuracy=0.833, val_loss=0.425, val_accuracy=0.797]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.94it/s][A
Epoch 88:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.412, v_num=1, train_loss=0.509, train_accuracy=0.833, val_loss=0.425, val_accuracy=0.797]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.11it/s][A
Epoch 88:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.412, v_num=1, train_loss=0.509,

Epoch 88, global step 20113: val_loss reached 0.41886 (best 0.41597), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35.ckpt" as top 2


Epoch 89:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.431, v_num=1, train_loss=0.295, train_accuracy=0.944, val_loss=0.419, val_accuracy=0.811]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 89:  89%|████████▉ | 228/255 [02:40<00:18,  1.42it/s, loss=0.431, v_num=1, train_loss=0.295, train_accuracy=0.944, val_loss=0.419, val_accuracy=0.811]
Validating:   7%|▋         | 2/29 [00:02<00:33,  1.24s/it][A
Epoch 89:  90%|█████████ | 230/255 [02:40<00:17,  1.43it/s, loss=0.431, v_num=1, train_loss=0.295, train_accuracy=0.944, val_loss=0.419, val_accuracy=0.811]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.87it/s][A
Epoch 89:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.431, v_num=1, train_loss=0.295, train_accuracy=0.944, val_loss=0.419, val_accuracy=0.811]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.02it/s][A
Epoch 89:  92%|█████████▏| 234/255 [02:41<00:14,  1.45it/s, loss=0.431, v_num=1, train_loss=0.295,

Epoch 89, global step 20339: val_loss was not in top 2


Epoch 90:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.448, v_num=1, train_loss=0.288, train_accuracy=0.833, val_loss=0.429, val_accuracy=0.798]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 90:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.448, v_num=1, train_loss=0.288, train_accuracy=0.833, val_loss=0.429, val_accuracy=0.798]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.19s/it][A
Epoch 90:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.448, v_num=1, train_loss=0.288, train_accuracy=0.833, val_loss=0.429, val_accuracy=0.798]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.93it/s][A
Epoch 90:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.448, v_num=1, train_loss=0.288, train_accuracy=0.833, val_loss=0.429, val_accuracy=0.798]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.08it/s][A
Epoch 90:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.448, v_num=1, train_loss=0.288,

Epoch 90, global step 20565: val_loss was not in top 2


Epoch 91:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.378, v_num=1, train_loss=0.330, train_accuracy=0.778, val_loss=0.431, val_accuracy=0.795]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 91:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.378, v_num=1, train_loss=0.330, train_accuracy=0.778, val_loss=0.431, val_accuracy=0.795]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.19s/it][A
Epoch 91:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.378, v_num=1, train_loss=0.330, train_accuracy=0.778, val_loss=0.431, val_accuracy=0.795]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.94it/s][A
Epoch 91:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.378, v_num=1, train_loss=0.330, train_accuracy=0.778, val_loss=0.431, val_accuracy=0.795]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.01it/s][A
Epoch 91:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.378, v_num=1, train_loss=0.330,

Epoch 91, global step 20791: val_loss was not in top 2


Epoch 92:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.375, v_num=1, train_loss=0.463, train_accuracy=0.833, val_loss=0.446, val_accuracy=0.789]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 92:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.375, v_num=1, train_loss=0.463, train_accuracy=0.833, val_loss=0.446, val_accuracy=0.789]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.20s/it][A
Epoch 92:  90%|█████████ | 230/255 [02:40<00:17,  1.43it/s, loss=0.375, v_num=1, train_loss=0.463, train_accuracy=0.833, val_loss=0.446, val_accuracy=0.789]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.93it/s][A
Epoch 92:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.375, v_num=1, train_loss=0.463, train_accuracy=0.833, val_loss=0.446, val_accuracy=0.789]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.06it/s][A
Epoch 92:  92%|█████████▏| 234/255 [02:41<00:14,  1.45it/s, loss=0.375, v_num=1, train_loss=0.463,

Epoch 92, global step 21017: val_loss reached 0.40202 (best 0.40202), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35.ckpt" as top 2


Epoch 93:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.387, v_num=1, train_loss=0.251, train_accuracy=0.944, val_loss=0.402, val_accuracy=0.811]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 93:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.387, v_num=1, train_loss=0.251, train_accuracy=0.944, val_loss=0.402, val_accuracy=0.811]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 93:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.387, v_num=1, train_loss=0.251, train_accuracy=0.944, val_loss=0.402, val_accuracy=0.811]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.95it/s][A
Epoch 93:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.387, v_num=1, train_loss=0.251, train_accuracy=0.944, val_loss=0.402, val_accuracy=0.811]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.10it/s][A
Epoch 93:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.387, v_num=1, train_loss=0.251,

Epoch 93, global step 21243: val_loss was not in top 2


Epoch 94:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.43, v_num=1, train_loss=0.318, train_accuracy=0.889, val_loss=0.416, val_accuracy=0.798] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 94:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.43, v_num=1, train_loss=0.318, train_accuracy=0.889, val_loss=0.416, val_accuracy=0.798]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 94:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.43, v_num=1, train_loss=0.318, train_accuracy=0.889, val_loss=0.416, val_accuracy=0.798]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.94it/s][A
Epoch 94:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.43, v_num=1, train_loss=0.318, train_accuracy=0.889, val_loss=0.416, val_accuracy=0.798]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.10it/s][A
Epoch 94:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.43, v_num=1, train_loss=0.318, tra

Epoch 94, global step 21469: val_loss was not in top 2


Epoch 95:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.432, v_num=1, train_loss=0.511, train_accuracy=0.556, val_loss=0.475, val_accuracy=0.773]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 95:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.432, v_num=1, train_loss=0.511, train_accuracy=0.556, val_loss=0.475, val_accuracy=0.773]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.19s/it][A
Epoch 95:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.432, v_num=1, train_loss=0.511, train_accuracy=0.556, val_loss=0.475, val_accuracy=0.773]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.95it/s][A
Epoch 95:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.432, v_num=1, train_loss=0.511, train_accuracy=0.556, val_loss=0.475, val_accuracy=0.773]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.11it/s][A
Epoch 95:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.432, v_num=1, train_loss=0.511,

Epoch 95, global step 21695: val_loss was not in top 2


Epoch 96:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.414, v_num=1, train_loss=0.449, train_accuracy=0.833, val_loss=0.427, val_accuracy=0.795]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 96:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.414, v_num=1, train_loss=0.449, train_accuracy=0.833, val_loss=0.427, val_accuracy=0.795]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.21s/it][A
Epoch 96:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.414, v_num=1, train_loss=0.449, train_accuracy=0.833, val_loss=0.427, val_accuracy=0.795]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.92it/s][A
Epoch 96:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.414, v_num=1, train_loss=0.449, train_accuracy=0.833, val_loss=0.427, val_accuracy=0.795]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.04it/s][A
Epoch 96:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.414, v_num=1, train_loss=0.449,

Epoch 96, global step 21921: val_loss reached 0.40412 (best 0.40202), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35-v1.ckpt" as top 2


Epoch 97:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.372, v_num=1, train_loss=0.530, train_accuracy=0.778, val_loss=0.404, val_accuracy=0.814]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 97:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.372, v_num=1, train_loss=0.530, train_accuracy=0.778, val_loss=0.404, val_accuracy=0.814]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.20s/it][A
Epoch 97:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.372, v_num=1, train_loss=0.530, train_accuracy=0.778, val_loss=0.404, val_accuracy=0.814]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.93it/s][A
Epoch 97:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.372, v_num=1, train_loss=0.530, train_accuracy=0.778, val_loss=0.404, val_accuracy=0.814]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.05it/s][A
Epoch 97:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.372, v_num=1, train_loss=0.530,

Epoch 97, global step 22147: val_loss was not in top 2


Epoch 98:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.342, v_num=1, train_loss=0.226, train_accuracy=0.889, val_loss=0.493, val_accuracy=0.769]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 98:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.342, v_num=1, train_loss=0.226, train_accuracy=0.889, val_loss=0.493, val_accuracy=0.769]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.20s/it][A
Epoch 98:  90%|█████████ | 230/255 [02:40<00:17,  1.43it/s, loss=0.342, v_num=1, train_loss=0.226, train_accuracy=0.889, val_loss=0.493, val_accuracy=0.769]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.92it/s][A
Epoch 98:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.342, v_num=1, train_loss=0.226, train_accuracy=0.889, val_loss=0.493, val_accuracy=0.769]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.05it/s][A
Epoch 98:  92%|█████████▏| 234/255 [02:41<00:14,  1.45it/s, loss=0.342, v_num=1, train_loss=0.226,

Epoch 98, global step 22373: val_loss reached 0.39390 (best 0.39390), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35-v1.ckpt" as top 2


Epoch 99:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.346, v_num=1, train_loss=0.288, train_accuracy=0.833, val_loss=0.394, val_accuracy=0.820]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 99:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.346, v_num=1, train_loss=0.288, train_accuracy=0.833, val_loss=0.394, val_accuracy=0.820]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.17s/it][A
Epoch 99:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.346, v_num=1, train_loss=0.288, train_accuracy=0.833, val_loss=0.394, val_accuracy=0.820]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.97it/s][A
Epoch 99:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.346, v_num=1, train_loss=0.288, train_accuracy=0.833, val_loss=0.394, val_accuracy=0.820]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.07it/s][A
Epoch 99:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.346, v_num=1, train_loss=0.288,

Epoch 99, global step 22599: val_loss reached 0.38312 (best 0.38312), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35.ckpt" as top 2


Epoch 100:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.429, v_num=1, train_loss=0.565, train_accuracy=0.833, val_loss=0.383, val_accuracy=0.825]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 100:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.429, v_num=1, train_loss=0.565, train_accuracy=0.833, val_loss=0.383, val_accuracy=0.825]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 100:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.429, v_num=1, train_loss=0.565, train_accuracy=0.833, val_loss=0.383, val_accuracy=0.825]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.95it/s][A
Epoch 100:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.429, v_num=1, train_loss=0.565, train_accuracy=0.833, val_loss=0.383, val_accuracy=0.825]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.08it/s][A
Epoch 100:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.429, v_num=1, train_loss=0

Epoch 100, global step 22825: val_loss was not in top 2


Epoch 101:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.341, v_num=1, train_loss=0.381, train_accuracy=0.778, val_loss=0.428, val_accuracy=0.796]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 101:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.341, v_num=1, train_loss=0.381, train_accuracy=0.778, val_loss=0.428, val_accuracy=0.796]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.19s/it][A
Epoch 101:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.341, v_num=1, train_loss=0.381, train_accuracy=0.778, val_loss=0.428, val_accuracy=0.796]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.95it/s][A
Epoch 101:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.341, v_num=1, train_loss=0.381, train_accuracy=0.778, val_loss=0.428, val_accuracy=0.796]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.09it/s][A
Epoch 101:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.341, v_num=1, train_loss=0

Epoch 101, global step 23051: val_loss was not in top 2


Epoch 102:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.359, v_num=1, train_loss=0.596, train_accuracy=0.722, val_loss=0.402, val_accuracy=0.823]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 102:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.359, v_num=1, train_loss=0.596, train_accuracy=0.722, val_loss=0.402, val_accuracy=0.823]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.19s/it][A
Epoch 102:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.359, v_num=1, train_loss=0.596, train_accuracy=0.722, val_loss=0.402, val_accuracy=0.823]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.95it/s][A
Epoch 102:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.359, v_num=1, train_loss=0.596, train_accuracy=0.722, val_loss=0.402, val_accuracy=0.823]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.07it/s][A
Epoch 102:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.359, v_num=1, train_loss=0

Epoch 102, global step 23277: val_loss was not in top 2


Epoch 103:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.417, v_num=1, train_loss=0.534, train_accuracy=0.778, val_loss=0.411, val_accuracy=0.815]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 103:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.417, v_num=1, train_loss=0.534, train_accuracy=0.778, val_loss=0.411, val_accuracy=0.815]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.22s/it][A
Epoch 103:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.417, v_num=1, train_loss=0.534, train_accuracy=0.778, val_loss=0.411, val_accuracy=0.815]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.92it/s][A
Epoch 103:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.417, v_num=1, train_loss=0.534, train_accuracy=0.778, val_loss=0.411, val_accuracy=0.815]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.08it/s][A
Epoch 103:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.417, v_num=1, train_loss=0

Epoch 103, global step 23503: val_loss was not in top 2


Epoch 104:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.412, v_num=1, train_loss=0.532, train_accuracy=0.778, val_loss=0.433, val_accuracy=0.805]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 104:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.412, v_num=1, train_loss=0.532, train_accuracy=0.778, val_loss=0.433, val_accuracy=0.805]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 104:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.412, v_num=1, train_loss=0.532, train_accuracy=0.778, val_loss=0.433, val_accuracy=0.805]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.92it/s][A
Epoch 104:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.412, v_num=1, train_loss=0.532, train_accuracy=0.778, val_loss=0.433, val_accuracy=0.805]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.08it/s][A
Epoch 104:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.412, v_num=1, train_loss=0

Epoch 104, global step 23729: val_loss was not in top 2


Epoch 105:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.354, v_num=1, train_loss=0.411, train_accuracy=0.833, val_loss=0.426, val_accuracy=0.794]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 105:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.354, v_num=1, train_loss=0.411, train_accuracy=0.833, val_loss=0.426, val_accuracy=0.794]
Validating:   7%|▋         | 2/29 [00:02<00:33,  1.24s/it][A
Epoch 105:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.354, v_num=1, train_loss=0.411, train_accuracy=0.833, val_loss=0.426, val_accuracy=0.794]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.86it/s][A
Epoch 105:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.354, v_num=1, train_loss=0.411, train_accuracy=0.833, val_loss=0.426, val_accuracy=0.794]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.01it/s][A
Epoch 105:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.354, v_num=1, train_loss=0

Epoch 105, global step 23955: val_loss was not in top 2


Epoch 106:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.387, v_num=1, train_loss=0.606, train_accuracy=0.667, val_loss=0.406, val_accuracy=0.815]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 106:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.387, v_num=1, train_loss=0.606, train_accuracy=0.667, val_loss=0.406, val_accuracy=0.815]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.20s/it][A
Epoch 106:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.387, v_num=1, train_loss=0.606, train_accuracy=0.667, val_loss=0.406, val_accuracy=0.815]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.91it/s][A
Epoch 106:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.387, v_num=1, train_loss=0.606, train_accuracy=0.667, val_loss=0.406, val_accuracy=0.815]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.08it/s][A
Epoch 106:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.387, v_num=1, train_loss=0

Epoch 106, global step 24181: val_loss was not in top 2


Epoch 107:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.408, v_num=1, train_loss=0.236, train_accuracy=0.889, val_loss=0.498, val_accuracy=0.757]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 107:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.408, v_num=1, train_loss=0.236, train_accuracy=0.889, val_loss=0.498, val_accuracy=0.757]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 107:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.408, v_num=1, train_loss=0.236, train_accuracy=0.889, val_loss=0.498, val_accuracy=0.757]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.92it/s][A
Epoch 107:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.408, v_num=1, train_loss=0.236, train_accuracy=0.889, val_loss=0.498, val_accuracy=0.757]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.04it/s][A
Epoch 107:  92%|█████████▏| 234/255 [02:41<00:14,  1.45it/s, loss=0.408, v_num=1, train_loss=0

Epoch 107, global step 24407: val_loss was not in top 2


Epoch 108:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.469, v_num=1, train_loss=0.472, train_accuracy=0.722, val_loss=0.560, val_accuracy=0.753]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 108:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.469, v_num=1, train_loss=0.472, train_accuracy=0.722, val_loss=0.560, val_accuracy=0.753]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.20s/it][A
Epoch 108:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.469, v_num=1, train_loss=0.472, train_accuracy=0.722, val_loss=0.560, val_accuracy=0.753]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.91it/s][A
Epoch 108:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.469, v_num=1, train_loss=0.472, train_accuracy=0.722, val_loss=0.560, val_accuracy=0.753]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.02it/s][A
Epoch 108:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.469, v_num=1, train_loss=0

Epoch 108, global step 24633: val_loss was not in top 2


Epoch 109:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.424, v_num=1, train_loss=0.395, train_accuracy=0.833, val_loss=0.499, val_accuracy=0.741]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 109:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.424, v_num=1, train_loss=0.395, train_accuracy=0.833, val_loss=0.499, val_accuracy=0.741]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.19s/it][A
Epoch 109:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.424, v_num=1, train_loss=0.395, train_accuracy=0.833, val_loss=0.499, val_accuracy=0.741]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.93it/s][A
Epoch 109:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.424, v_num=1, train_loss=0.395, train_accuracy=0.833, val_loss=0.499, val_accuracy=0.741]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.06it/s][A
Epoch 109:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.424, v_num=1, train_loss=0

Epoch 109, global step 24859: val_loss was not in top 2


Epoch 110:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.376, v_num=1, train_loss=0.436, train_accuracy=0.778, val_loss=0.460, val_accuracy=0.767]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 110:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.376, v_num=1, train_loss=0.436, train_accuracy=0.778, val_loss=0.460, val_accuracy=0.767]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.19s/it][A
Epoch 110:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.376, v_num=1, train_loss=0.436, train_accuracy=0.778, val_loss=0.460, val_accuracy=0.767]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.93it/s][A
Epoch 110:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.376, v_num=1, train_loss=0.436, train_accuracy=0.778, val_loss=0.460, val_accuracy=0.767]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.10it/s][A
Epoch 110:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.376, v_num=1, train_loss=0

Epoch 110, global step 25085: val_loss was not in top 2


Epoch 111:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.392, v_num=1, train_loss=0.480, train_accuracy=0.778, val_loss=0.425, val_accuracy=0.796]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 111:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.392, v_num=1, train_loss=0.480, train_accuracy=0.778, val_loss=0.425, val_accuracy=0.796]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.19s/it][A
Epoch 111:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.392, v_num=1, train_loss=0.480, train_accuracy=0.778, val_loss=0.425, val_accuracy=0.796]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.94it/s][A
Epoch 111:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.392, v_num=1, train_loss=0.480, train_accuracy=0.778, val_loss=0.425, val_accuracy=0.796]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.06it/s][A
Epoch 111:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.392, v_num=1, train_loss=0

Epoch 111, global step 25311: val_loss was not in top 2


Epoch 112:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.353, v_num=1, train_loss=0.303, train_accuracy=0.833, val_loss=0.406, val_accuracy=0.806]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 112:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.353, v_num=1, train_loss=0.303, train_accuracy=0.833, val_loss=0.406, val_accuracy=0.806]
Validating:   7%|▋         | 2/29 [00:02<00:33,  1.25s/it][A
Epoch 112:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.353, v_num=1, train_loss=0.303, train_accuracy=0.833, val_loss=0.406, val_accuracy=0.806]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.87it/s][A
Epoch 112:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.353, v_num=1, train_loss=0.303, train_accuracy=0.833, val_loss=0.406, val_accuracy=0.806]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.01it/s][A
Epoch 112:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.353, v_num=1, train_loss=0

Epoch 112, global step 25537: val_loss reached 0.37172 (best 0.37172), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35-v1.ckpt" as top 2


Epoch 113:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.342, v_num=1, train_loss=0.480, train_accuracy=0.778, val_loss=0.372, val_accuracy=0.825]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 113:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.342, v_num=1, train_loss=0.480, train_accuracy=0.778, val_loss=0.372, val_accuracy=0.825]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.19s/it][A
Epoch 113:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.342, v_num=1, train_loss=0.480, train_accuracy=0.778, val_loss=0.372, val_accuracy=0.825]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.96it/s][A
Epoch 113:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.342, v_num=1, train_loss=0.480, train_accuracy=0.778, val_loss=0.372, val_accuracy=0.825]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.13it/s][A
Epoch 113:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.342, v_num=1, train_loss=0

Epoch 113, global step 25763: val_loss was not in top 2


Epoch 114:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.372, v_num=1, train_loss=0.384, train_accuracy=0.833, val_loss=0.402, val_accuracy=0.800]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 114:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.372, v_num=1, train_loss=0.384, train_accuracy=0.833, val_loss=0.402, val_accuracy=0.800]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.19s/it][A
Epoch 114:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.372, v_num=1, train_loss=0.384, train_accuracy=0.833, val_loss=0.402, val_accuracy=0.800]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.94it/s][A
Epoch 114:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.372, v_num=1, train_loss=0.384, train_accuracy=0.833, val_loss=0.402, val_accuracy=0.800]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.07it/s][A
Epoch 114:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.372, v_num=1, train_loss=0

Epoch 114, global step 25989: val_loss was not in top 2


Epoch 115:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.375, v_num=1, train_loss=0.338, train_accuracy=0.889, val_loss=0.384, val_accuracy=0.809]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 115:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.375, v_num=1, train_loss=0.338, train_accuracy=0.889, val_loss=0.384, val_accuracy=0.809]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.17s/it][A
Epoch 115:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.375, v_num=1, train_loss=0.338, train_accuracy=0.889, val_loss=0.384, val_accuracy=0.809]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.95it/s][A
Epoch 115:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.375, v_num=1, train_loss=0.338, train_accuracy=0.889, val_loss=0.384, val_accuracy=0.809]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.07it/s][A
Epoch 115:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.375, v_num=1, train_loss=0

Epoch 115, global step 26215: val_loss was not in top 2


Epoch 116:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.344, v_num=1, train_loss=0.183, train_accuracy=0.889, val_loss=0.391, val_accuracy=0.808]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 116:  89%|████████▉ | 228/255 [02:40<00:18,  1.42it/s, loss=0.344, v_num=1, train_loss=0.183, train_accuracy=0.889, val_loss=0.391, val_accuracy=0.808]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.21s/it][A
Epoch 116:  90%|█████████ | 230/255 [02:40<00:17,  1.43it/s, loss=0.344, v_num=1, train_loss=0.183, train_accuracy=0.889, val_loss=0.391, val_accuracy=0.808]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.90it/s][A
Epoch 116:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.344, v_num=1, train_loss=0.183, train_accuracy=0.889, val_loss=0.391, val_accuracy=0.808]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.02it/s][A
Epoch 116:  92%|█████████▏| 234/255 [02:41<00:14,  1.45it/s, loss=0.344, v_num=1, train_loss=0

Epoch 116, global step 26441: val_loss was not in top 2


Epoch 117:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.334, v_num=1, train_loss=0.238, train_accuracy=0.889, val_loss=0.387, val_accuracy=0.823]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 117:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.334, v_num=1, train_loss=0.238, train_accuracy=0.889, val_loss=0.387, val_accuracy=0.823]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 117:  90%|█████████ | 230/255 [02:40<00:17,  1.43it/s, loss=0.334, v_num=1, train_loss=0.238, train_accuracy=0.889, val_loss=0.387, val_accuracy=0.823]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.90it/s][A
Epoch 117:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.334, v_num=1, train_loss=0.238, train_accuracy=0.889, val_loss=0.387, val_accuracy=0.823]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.04it/s][A
Epoch 117:  92%|█████████▏| 234/255 [02:41<00:14,  1.45it/s, loss=0.334, v_num=1, train_loss=0

Epoch 117, global step 26667: val_loss was not in top 2


Epoch 118:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.331, v_num=1, train_loss=0.646, train_accuracy=0.833, val_loss=0.392, val_accuracy=0.823]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 118:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.331, v_num=1, train_loss=0.646, train_accuracy=0.833, val_loss=0.392, val_accuracy=0.823]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.19s/it][A
Epoch 118:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.331, v_num=1, train_loss=0.646, train_accuracy=0.833, val_loss=0.392, val_accuracy=0.823]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.94it/s][A
Epoch 118:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.331, v_num=1, train_loss=0.646, train_accuracy=0.833, val_loss=0.392, val_accuracy=0.823]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.08it/s][A
Epoch 118:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.331, v_num=1, train_loss=0

Epoch 118, global step 26893: val_loss was not in top 2


Epoch 119:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.397, v_num=1, train_loss=0.263, train_accuracy=0.944, val_loss=0.396, val_accuracy=0.823]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 119:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.397, v_num=1, train_loss=0.263, train_accuracy=0.944, val_loss=0.396, val_accuracy=0.823]
Validating:   7%|▋         | 2/29 [00:02<00:33,  1.23s/it][A
Epoch 119:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.397, v_num=1, train_loss=0.263, train_accuracy=0.944, val_loss=0.396, val_accuracy=0.823]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.88it/s][A
Epoch 119:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.397, v_num=1, train_loss=0.263, train_accuracy=0.944, val_loss=0.396, val_accuracy=0.823]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.03it/s][A
Epoch 119:  92%|█████████▏| 234/255 [02:40<00:14,  1.45it/s, loss=0.397, v_num=1, train_loss=0

Epoch 119, global step 27119: val_loss was not in top 2


Epoch 120:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.408, v_num=1, train_loss=0.613, train_accuracy=0.667, val_loss=0.463, val_accuracy=0.777]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 120:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.408, v_num=1, train_loss=0.613, train_accuracy=0.667, val_loss=0.463, val_accuracy=0.777]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.27s/it][A
Epoch 120:  90%|█████████ | 230/255 [02:40<00:17,  1.43it/s, loss=0.408, v_num=1, train_loss=0.613, train_accuracy=0.667, val_loss=0.463, val_accuracy=0.777]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.81it/s][A
Epoch 120:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.408, v_num=1, train_loss=0.613, train_accuracy=0.667, val_loss=0.463, val_accuracy=0.777]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.94it/s][A
Epoch 120:  92%|█████████▏| 234/255 [02:41<00:14,  1.45it/s, loss=0.408, v_num=1, train_loss=0

Epoch 120, global step 27345: val_loss was not in top 2


Epoch 121:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.393, v_num=1, train_loss=0.478, train_accuracy=0.667, val_loss=0.424, val_accuracy=0.791]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 121:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.393, v_num=1, train_loss=0.478, train_accuracy=0.667, val_loss=0.424, val_accuracy=0.791]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 121:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.393, v_num=1, train_loss=0.478, train_accuracy=0.667, val_loss=0.424, val_accuracy=0.791]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.95it/s][A
Epoch 121:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.393, v_num=1, train_loss=0.478, train_accuracy=0.667, val_loss=0.424, val_accuracy=0.791]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.04it/s][A
Epoch 121:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.393, v_num=1, train_loss=0

Epoch 121, global step 27571: val_loss reached 0.37427 (best 0.37172), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35.ckpt" as top 2


Epoch 122:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.309, v_num=1, train_loss=0.450, train_accuracy=0.778, val_loss=0.374, val_accuracy=0.825]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 122:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.309, v_num=1, train_loss=0.450, train_accuracy=0.778, val_loss=0.374, val_accuracy=0.825]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.19s/it][A
Epoch 122:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.309, v_num=1, train_loss=0.450, train_accuracy=0.778, val_loss=0.374, val_accuracy=0.825]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.93it/s][A
Epoch 122:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.309, v_num=1, train_loss=0.450, train_accuracy=0.778, val_loss=0.374, val_accuracy=0.825]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.09it/s][A
Epoch 122:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.309, v_num=1, train_loss=0

Epoch 122, global step 27797: val_loss reached 0.34873 (best 0.34873), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35.ckpt" as top 2


Epoch 123:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.351, v_num=1, train_loss=0.551, train_accuracy=0.889, val_loss=0.349, val_accuracy=0.845]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 123:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.351, v_num=1, train_loss=0.551, train_accuracy=0.889, val_loss=0.349, val_accuracy=0.845]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.17s/it][A
Epoch 123:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.351, v_num=1, train_loss=0.551, train_accuracy=0.889, val_loss=0.349, val_accuracy=0.845]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.94it/s][A
Epoch 123:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.351, v_num=1, train_loss=0.551, train_accuracy=0.889, val_loss=0.349, val_accuracy=0.845]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.05it/s][A
Epoch 123:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.351, v_num=1, train_loss=0

Epoch 123, global step 28023: val_loss reached 0.36249 (best 0.34873), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35-v1.ckpt" as top 2


Epoch 124:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.327, v_num=1, train_loss=0.329, train_accuracy=0.944, val_loss=0.362, val_accuracy=0.825]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 124:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.327, v_num=1, train_loss=0.329, train_accuracy=0.944, val_loss=0.362, val_accuracy=0.825]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 124:  90%|█████████ | 230/255 [02:40<00:17,  1.43it/s, loss=0.327, v_num=1, train_loss=0.329, train_accuracy=0.944, val_loss=0.362, val_accuracy=0.825]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.95it/s][A
Epoch 124:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.327, v_num=1, train_loss=0.329, train_accuracy=0.944, val_loss=0.362, val_accuracy=0.825]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.10it/s][A
Epoch 124:  92%|█████████▏| 234/255 [02:41<00:14,  1.45it/s, loss=0.327, v_num=1, train_loss=0

Epoch 124, global step 28249: val_loss reached 0.36205 (best 0.34873), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-mi-35-v1.ckpt" as top 2


Epoch 125:  89%|████████▊ | 226/255 [02:37<00:20,  1.44it/s, loss=0.356, v_num=1, train_loss=0.423, train_accuracy=0.833, val_loss=0.362, val_accuracy=0.828]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 125:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.356, v_num=1, train_loss=0.423, train_accuracy=0.833, val_loss=0.362, val_accuracy=0.828]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.19s/it][A
Epoch 125:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.356, v_num=1, train_loss=0.423, train_accuracy=0.833, val_loss=0.362, val_accuracy=0.828]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.93it/s][A
Epoch 125:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.356, v_num=1, train_loss=0.423, train_accuracy=0.833, val_loss=0.362, val_accuracy=0.828]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.08it/s][A
Epoch 125:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.356, v_num=1, train_loss=0

Epoch 125, global step 28475: val_loss was not in top 2


Epoch 126:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.314, v_num=1, train_loss=0.287, train_accuracy=0.889, val_loss=0.371, val_accuracy=0.822]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 126:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.314, v_num=1, train_loss=0.287, train_accuracy=0.889, val_loss=0.371, val_accuracy=0.822]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.19s/it][A
Epoch 126:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.314, v_num=1, train_loss=0.287, train_accuracy=0.889, val_loss=0.371, val_accuracy=0.822]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.94it/s][A
Epoch 126:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.314, v_num=1, train_loss=0.287, train_accuracy=0.889, val_loss=0.371, val_accuracy=0.822]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.10it/s][A
Epoch 126:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.314, v_num=1, train_loss=0

Epoch 126, global step 28701: val_loss was not in top 2


Epoch 127:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.372, v_num=1, train_loss=0.370, train_accuracy=0.889, val_loss=0.368, val_accuracy=0.826]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 127:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.372, v_num=1, train_loss=0.370, train_accuracy=0.889, val_loss=0.368, val_accuracy=0.826]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.17s/it][A
Epoch 127:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.372, v_num=1, train_loss=0.370, train_accuracy=0.889, val_loss=0.368, val_accuracy=0.826]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.97it/s][A
Epoch 127:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.372, v_num=1, train_loss=0.370, train_accuracy=0.889, val_loss=0.368, val_accuracy=0.826]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.10it/s][A
Epoch 127:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.372, v_num=1, train_loss=0

Epoch 127, global step 28927: val_loss was not in top 2


Epoch 128:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.325, v_num=1, train_loss=0.592, train_accuracy=0.778, val_loss=0.373, val_accuracy=0.832]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 128:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.325, v_num=1, train_loss=0.592, train_accuracy=0.778, val_loss=0.373, val_accuracy=0.832]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.19s/it][A
Epoch 128:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.325, v_num=1, train_loss=0.592, train_accuracy=0.778, val_loss=0.373, val_accuracy=0.832]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.95it/s][A
Epoch 128:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.325, v_num=1, train_loss=0.592, train_accuracy=0.778, val_loss=0.373, val_accuracy=0.832]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.09it/s][A
Epoch 128:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.325, v_num=1, train_loss=0

Epoch 128, global step 29153: val_loss was not in top 2


Epoch 129:  39%|███▉      | 99/255 [01:10<01:50,  1.41it/s, loss=0.322, v_num=1, train_loss=0.331, train_accuracy=0.880, val_loss=0.406, val_accuracy=0.813] 

  rank_zero_warn("Detected KeyboardInterrupt, attempting graceful shutdown...")
LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1,2]


Testing: 0it [00:00, ?it/s]

## Load Checkpoint 

In [None]:
# best-checkpoint-corr-3-v1.ckptn
# trainer.fit(model, data_module, ckpt_path="/Workspace/code/checkpoints/best-checkpoint-corr-3-v1.ckpt")