In [1]:
import os
import pandas as pd
import numpy as np
from sklearn.preprocessing import LabelEncoder
from sklearn.model_selection import train_test_split
from sklearn.metrics import classification_report, confusion_matrix
import matplotlib.pyplot as plt

import torch
from torch import nn, optim
from torch.nn import functional as F
from torch.utils.data import Dataset, DataLoader

import torchmetrics
from torchmetrics.functional import accuracy

import pytorch_lightning as pl
from pytorch_lightning.loggers import TensorBoardLogger
from pytorch_lightning.callbacks import ModelCheckpoint

device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
print(device)

cuda


## Model Setup 

In [2]:
pl.seed_everything(42, workers=True)

class DrowsyDataset(Dataset):
    
    def __init__(self, sequences):
        self.sequences = sequences
        
    def __len__(self):
        return len(self.sequences)
    
    def __getitem__(self, idx):
        sequence, label = self.sequences[idx]
        return dict(
            sequence=torch.Tensor(sequence.to_numpy()),
            label=torch.tensor(label).long()
        )
    
class DrowsyDataModule(pl.LightningDataModule):
    
    def __init__(self, train_sequences, val_sequences, test_sequences, batch_size):
        super().__init__()
        self.train_sequences = train_sequences
        self.val_sequences = val_sequences
        self.test_sequences = test_sequences
        self.batch_size = batch_size

    def setup(self, stage=None):
        self.train_dataset = DrowsyDataset(self.train_sequences)
        self.val_dataset = DrowsyDataset(self.val_sequences)
        self.test_dataset = DrowsyDataset(self.test_sequences)
        
    def train_dataloader(self):
        return DataLoader(
            self.train_dataset,
            batch_size=self.batch_size,
            shuffle=True,
            num_workers=os.cpu_count()
        )
    
    def val_dataloader(self):
        return DataLoader(
            self.val_dataset,
            batch_size=self.batch_size,
            shuffle=False,
            num_workers=os.cpu_count()
        )
    
    def test_dataloader(self):
        return DataLoader(
            self.test_dataset,
            batch_size=self.batch_size,
            shuffle=False,
            num_workers=os.cpu_count()
        ) 

class DrowsyModel(nn.Module):
    
    def __init__(self, n_features, n_classes, n_hidden=256, n_layers=3):
        super().__init__()
        
        self.n_hidden = n_hidden
        
        self.lstm = nn.LSTM(
            input_size=n_features,
            hidden_size=n_hidden,
            num_layers=n_layers,
            batch_first=True,
            dropout=0.75
        )
        
        self.classifier = nn.Linear(n_hidden, n_classes)
        
    def forward(self, x):
        self.lstm.flatten_parameters()
        _, (hidden, _) = self.lstm(x)
        
        out = hidden[-1]
        return self.classifier(out)
    
class DrowsyPredictor(pl.LightningModule):
    
    def __init__(self, n_features: int, n_classes: int):
        super().__init__()
        self.model = DrowsyModel(n_features, n_classes)
        self.criterion = nn.CrossEntropyLoss()
        
    def forward(self, x, label=None):
        output = self.model(x)
        loss = 0
        if label is not None:
            loss = self.criterion(output, label)
        return loss, output
        
    def training_step(self, batch, batch_idx):
        sequences = batch["sequence"]
        labels = batch["label"]
        loss, outputs = self(sequences, labels)
        predictions = torch.argmax(outputs, dim=1)
        step_accuracy = accuracy(predictions, labels)
        
        self.log("train_loss", loss, prog_bar=True, logger=True)
        self.log("train_accuracy", step_accuracy, prog_bar=True, logger=True)
        
        return {"loss": loss, "accuracy": step_accuracy}
    
    def validation_step(self, batch, batch_idx):
        sequences = batch["sequence"]
        labels = batch["label"]
        loss, outputs = self(sequences, labels)
        predictions = torch.argmax(outputs, dim=1)
        step_accuracy = accuracy(predictions, labels)
        
        self.log("val_loss", loss, prog_bar=True, logger=True)
        self.log("val_accuracy", step_accuracy, prog_bar=True, logger=True)
        
        return {"loss": loss, "accuracy": step_accuracy}
    
    def test_step(self, batch, batch_idx):
        sequences = batch["sequence"]
        labels = batch["label"]
        loss, outputs = self(sequences, labels)
        predictions = torch.argmax(outputs, dim=1)
        step_accuracy = accuracy(predictions, labels)
        
        self.log("test_loss", loss, prog_bar=True, logger=True)
        self.log("test_accuracy", step_accuracy, prog_bar=True, logger=True)
        
        return {"loss": loss, "accuracy": step_accuracy}
    
    def configure_optimizers(self):
        return optim.Adam(self.parameters(), lr=0.0001)

Global seed set to 42


## 參數設置

In [3]:
%load_ext tensorboard
%reload_ext tensorboard
%tensorboard --logdir ./lightning_logs --host 0.0.0.0 --port=8888

Reusing TensorBoard on port 8888 (pid 116), started 0:01:15 ago. (Use '!kill 116' to kill it.)

In [4]:
X_train = pd.read_csv('../data2.csv')

In [5]:
N_EPOCHS = 200
BATCH_SIZE = 50

ORG_FEATURE_COLUMNS = ['TP8', 'FP2', 'FCZ', 'FT10', 'O2', 'O1', 'FT7', 'F4', 'TP7', 'C3', 'C4', 'F3', 'FT8', 'T6', 'HEOR', 'T5', 'VEOL', 'F7', 'FZ', 'VEOU', 'A1', 'P3', 'PZ', 'CP3', 'P4', 'CPZ', 'A2', 'HEOL', 'CP4', 'FT9', 'F8', 'OZ', 'CZ', 'FC4', 'FC3', 'FP1', 'PO1', 'T3', 'T4', 'PO2']
g = X_train.groupby("group")


## Main

In [None]:
n = 29
FEATURE_COLUMNS = ORG_FEATURE_COLUMNS[n:]

while(n < 30):
    print("------------------ Round: " + str(n) + " ------------------")
    print(FEATURE_COLUMNS)
    print("Len:", len(FEATURE_COLUMNS))
    
    label_encoder = LabelEncoder()
    encoded_labels = label_encoder.fit_transform(X_train.state)

    label_encoder.classes_

    X_train['label'] = encoded_labels

    # Prepare data ###########################################
    sequences = [] 

    for name, group in g:
        sequence_features = group[FEATURE_COLUMNS]
        label = group.label.iloc[0]

        # print((sequence_features, label))
        sequences.append((sequence_features, label))

    # Setting up train, test, val gruop #######################
    train_sequences, test_sequences = train_test_split(sequences, test_size=0.2)
    val_sequences, test_sequences = train_test_split(test_sequences, test_size=0.5)


    # Setting up data module ##################################
    data_module = DrowsyDataModule(
        train_sequences, val_sequences, test_sequences, BATCH_SIZE
    )

    model = DrowsyPredictor(
        n_features=len(FEATURE_COLUMNS), 
        n_classes=len(label_encoder.classes_)
    )

    # Check points and logger #################################
    checkpoint_callback = ModelCheckpoint(
        dirpath="checkpoints",
        filename="best-checkpoint-corr-" + str(n),
        save_top_k=2,
        verbose=True,
        monitor="val_loss",
        mode="min"
    )

    logger = TensorBoardLogger("lightning_logs", name="Drowsy_" + str(n))

    trainer = pl.Trainer(
        logger=logger,
        callbacks=[checkpoint_callback],
        max_epochs=N_EPOCHS,
        gpus=[1],
        # gpus=2, 
        # auto_select_gpus=True,
        auto_lr_find=True, 
        # check_val_every_n_epoch=10
        # refresh_rate=20,
    )
    
    # Training start
    if (n == 14):
        trainer.fit(model, data_module, ckpt_path="/Workspace/code/checkpoints/best-checkpoint-corr-29-v1.ckpt")
    else:
        trainer.fit(model, data_module)
    trainer.test(model, data_module)
    
    FEATURE_COLUMNS.pop(0)
    n = n + 1

------------------ Round: 28 ------------------
['CP4', 'FT9', 'F8', 'OZ', 'CZ', 'FC4', 'FC3', 'FP1', 'PO1', 'T3', 'T4', 'PO2']
Len: 12


GPU available: True, used: True
TPU available: False, using: 0 TPU cores
IPU available: False, using: 0 IPUs
LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1,2]

  | Name      | Type             | Params
-----------------------------------------------
0 | model     | DrowsyModel      | 1.3 M 
1 | criterion | CrossEntropyLoss | 0     
-----------------------------------------------
1.3 M     Trainable params
0         Non-trainable params
1.3 M     Total params
5.319     Total estimated model params size (MB)
  rank_zero_warn(f"Checkpoint directory {dirpath} exists and is not empty.")


                                                                      

Global seed set to 42


Epoch 0:  89%|████████▊ | 226/255 [02:40<00:20,  1.41it/s, loss=0.651, v_num=3, train_loss=0.694, train_accuracy=0.556]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 0:  89%|████████▉ | 228/255 [02:42<00:19,  1.40it/s, loss=0.651, v_num=3, train_loss=0.694, train_accuracy=0.556]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.22s/it][A
Epoch 0:  90%|█████████ | 230/255 [02:43<00:17,  1.41it/s, loss=0.651, v_num=3, train_loss=0.694, train_accuracy=0.556]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.88it/s][A
Epoch 0:  91%|█████████ | 232/255 [02:43<00:16,  1.42it/s, loss=0.651, v_num=3, train_loss=0.694, train_accuracy=0.556]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.96it/s][A
Epoch 0:  92%|█████████▏| 234/255 [02:44<00:14,  1.43it/s, loss=0.651, v_num=3, train_loss=0.694, train_accuracy=0.556]
Validating:  28%|██▊       | 8/29 [00:04<00:05,  3.92it/s][A
Epoch 0:  93%|█████████▎| 236/255 [02:44<00:13,  1.44it/s, loss=

Epoch 0, global step 225: val_loss reached 0.67431 (best 0.67431), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28.ckpt" as top 2


Epoch 1:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.67, v_num=3, train_loss=0.608, train_accuracy=0.722, val_loss=0.674, val_accuracy=0.597] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 1:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.67, v_num=3, train_loss=0.608, train_accuracy=0.722, val_loss=0.674, val_accuracy=0.597]
Validating:   7%|▋         | 2/29 [00:02<00:33,  1.25s/it][A
Epoch 1:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.67, v_num=3, train_loss=0.608, train_accuracy=0.722, val_loss=0.674, val_accuracy=0.597]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.86it/s][A
Epoch 1:  91%|█████████ | 232/255 [02:44<00:16,  1.41it/s, loss=0.67, v_num=3, train_loss=0.608, train_accuracy=0.722, val_loss=0.674, val_accuracy=0.597]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.02it/s][A
Epoch 1:  92%|█████████▏| 234/255 [02:45<00:14,  1.42it/s, loss=0.67, v_num=3, train_loss=0.608, train_ac

Epoch 1, global step 451: val_loss reached 0.66977 (best 0.66977), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28-v1.ckpt" as top 2


Epoch 2:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.607, v_num=3, train_loss=0.622, train_accuracy=0.722, val_loss=0.670, val_accuracy=0.598]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 2:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.607, v_num=3, train_loss=0.622, train_accuracy=0.722, val_loss=0.670, val_accuracy=0.598]
Validating:   7%|▋         | 2/29 [00:02<00:34,  1.26s/it][A
Epoch 2:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.607, v_num=3, train_loss=0.622, train_accuracy=0.722, val_loss=0.670, val_accuracy=0.598]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.88it/s][A
Epoch 2:  91%|█████████ | 232/255 [02:44<00:16,  1.41it/s, loss=0.607, v_num=3, train_loss=0.622, train_accuracy=0.722, val_loss=0.670, val_accuracy=0.598]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.05it/s][A
Epoch 2:  92%|█████████▏| 234/255 [02:45<00:14,  1.42it/s, loss=0.607, v_num=3, train_loss=0.622, trai

Epoch 2, global step 677: val_loss reached 0.61586 (best 0.61586), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28.ckpt" as top 2


Epoch 3:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.569, v_num=3, train_loss=0.733, train_accuracy=0.722, val_loss=0.616, val_accuracy=0.663]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 3:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.569, v_num=3, train_loss=0.733, train_accuracy=0.722, val_loss=0.616, val_accuracy=0.663]
Validating:   7%|▋         | 2/29 [00:02<00:34,  1.27s/it][A
Epoch 3:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.569, v_num=3, train_loss=0.733, train_accuracy=0.722, val_loss=0.616, val_accuracy=0.663]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.86it/s][A
Epoch 3:  91%|█████████ | 232/255 [02:45<00:16,  1.41it/s, loss=0.569, v_num=3, train_loss=0.733, train_accuracy=0.722, val_loss=0.616, val_accuracy=0.663]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.03it/s][A
Epoch 3:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.569, v_num=3, train_loss=0.733, trai

Epoch 3, global step 903: val_loss reached 0.64446 (best 0.61586), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28-v1.ckpt" as top 2


Epoch 4:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.619, v_num=3, train_loss=0.501, train_accuracy=0.722, val_loss=0.644, val_accuracy=0.672]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 4:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.619, v_num=3, train_loss=0.501, train_accuracy=0.722, val_loss=0.644, val_accuracy=0.672]
Validating:   7%|▋         | 2/29 [00:02<00:34,  1.26s/it][A
Epoch 4:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.619, v_num=3, train_loss=0.501, train_accuracy=0.722, val_loss=0.644, val_accuracy=0.672]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.87it/s][A
Epoch 4:  91%|█████████ | 232/255 [02:45<00:16,  1.41it/s, loss=0.619, v_num=3, train_loss=0.501, train_accuracy=0.722, val_loss=0.644, val_accuracy=0.672]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.02it/s][A
Epoch 4:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.619, v_num=3, train_loss=0.501, trai

Epoch 4, global step 1129: val_loss reached 0.63609 (best 0.61586), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28-v1.ckpt" as top 2


Epoch 5:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.616, v_num=3, train_loss=0.805, train_accuracy=0.611, val_loss=0.636, val_accuracy=0.622]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 5:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.616, v_num=3, train_loss=0.805, train_accuracy=0.611, val_loss=0.636, val_accuracy=0.622]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.29s/it][A
Epoch 5:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.616, v_num=3, train_loss=0.805, train_accuracy=0.611, val_loss=0.636, val_accuracy=0.622]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.83it/s][A
Epoch 5:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.616, v_num=3, train_loss=0.805, train_accuracy=0.611, val_loss=0.636, val_accuracy=0.622]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.97it/s][A
Epoch 5:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.616, v_num=3, train_loss=0.805, trai

Epoch 5, global step 1355: val_loss was not in top 2


Epoch 6:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.559, v_num=3, train_loss=0.629, train_accuracy=0.667, val_loss=0.641, val_accuracy=0.666]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 6:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.559, v_num=3, train_loss=0.629, train_accuracy=0.667, val_loss=0.641, val_accuracy=0.666]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.33s/it][A
Epoch 6:  90%|█████████ | 230/255 [02:44<00:17,  1.39it/s, loss=0.559, v_num=3, train_loss=0.629, train_accuracy=0.667, val_loss=0.641, val_accuracy=0.666]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.80it/s][A
Epoch 6:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.559, v_num=3, train_loss=0.629, train_accuracy=0.667, val_loss=0.641, val_accuracy=0.666]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.94it/s][A
Epoch 6:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.559, v_num=3, train_loss=0.629, trai

Epoch 6, global step 1581: val_loss reached 0.60035 (best 0.60035), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28-v1.ckpt" as top 2


Epoch 7:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.602, v_num=3, train_loss=0.653, train_accuracy=0.611, val_loss=0.600, val_accuracy=0.710]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 7:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.602, v_num=3, train_loss=0.653, train_accuracy=0.611, val_loss=0.600, val_accuracy=0.710]
Validating:   7%|▋         | 2/29 [00:02<00:34,  1.27s/it][A
Epoch 7:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.602, v_num=3, train_loss=0.653, train_accuracy=0.611, val_loss=0.600, val_accuracy=0.710]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.86it/s][A
Epoch 7:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.602, v_num=3, train_loss=0.653, train_accuracy=0.611, val_loss=0.600, val_accuracy=0.710]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.00it/s][A
Epoch 7:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.602, v_num=3, train_loss=0.653, trai

Epoch 7, global step 1807: val_loss was not in top 2


Epoch 8:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.557, v_num=3, train_loss=0.557, train_accuracy=0.722, val_loss=0.657, val_accuracy=0.664]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 8:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.557, v_num=3, train_loss=0.557, train_accuracy=0.722, val_loss=0.657, val_accuracy=0.664]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.28s/it][A
Epoch 8:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.557, v_num=3, train_loss=0.557, train_accuracy=0.722, val_loss=0.657, val_accuracy=0.664]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.84it/s][A
Epoch 8:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.557, v_num=3, train_loss=0.557, train_accuracy=0.722, val_loss=0.657, val_accuracy=0.664]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.01it/s][A
Epoch 8:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.557, v_num=3, train_loss=0.557, trai

Epoch 8, global step 2033: val_loss reached 0.58963 (best 0.58963), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28.ckpt" as top 2


Epoch 9:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.553, v_num=3, train_loss=0.572, train_accuracy=0.667, val_loss=0.590, val_accuracy=0.716]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 9:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.553, v_num=3, train_loss=0.572, train_accuracy=0.667, val_loss=0.590, val_accuracy=0.716]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.29s/it][A
Epoch 9:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.553, v_num=3, train_loss=0.572, train_accuracy=0.667, val_loss=0.590, val_accuracy=0.716]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.83it/s][A
Epoch 9:  91%|█████████ | 232/255 [02:44<00:16,  1.41it/s, loss=0.553, v_num=3, train_loss=0.572, train_accuracy=0.667, val_loss=0.590, val_accuracy=0.716]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.00it/s][A
Epoch 9:  92%|█████████▏| 234/255 [02:45<00:14,  1.42it/s, loss=0.553, v_num=3, train_loss=0.572, trai

Epoch 9, global step 2259: val_loss reached 0.57720 (best 0.57720), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28-v1.ckpt" as top 2


Epoch 10:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.488, v_num=3, train_loss=0.696, train_accuracy=0.667, val_loss=0.577, val_accuracy=0.718]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 10:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.488, v_num=3, train_loss=0.696, train_accuracy=0.667, val_loss=0.577, val_accuracy=0.718]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.30s/it][A
Epoch 10:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.488, v_num=3, train_loss=0.696, train_accuracy=0.667, val_loss=0.577, val_accuracy=0.718]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.78it/s][A
Epoch 10:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.488, v_num=3, train_loss=0.696, train_accuracy=0.667, val_loss=0.577, val_accuracy=0.718]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.93it/s][A
Epoch 10:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.488, v_num=3, train_loss=0.696,

Epoch 10, global step 2485: val_loss reached 0.55083 (best 0.55083), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28.ckpt" as top 2


Epoch 11:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.528, v_num=3, train_loss=0.672, train_accuracy=0.556, val_loss=0.551, val_accuracy=0.754]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 11:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.528, v_num=3, train_loss=0.672, train_accuracy=0.556, val_loss=0.551, val_accuracy=0.754]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.27s/it][A
Epoch 11:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.528, v_num=3, train_loss=0.672, train_accuracy=0.556, val_loss=0.551, val_accuracy=0.754]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.79it/s][A
Epoch 11:  91%|█████████ | 232/255 [02:44<00:16,  1.41it/s, loss=0.528, v_num=3, train_loss=0.672, train_accuracy=0.556, val_loss=0.551, val_accuracy=0.754]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.95it/s][A
Epoch 11:  92%|█████████▏| 234/255 [02:45<00:14,  1.42it/s, loss=0.528, v_num=3, train_loss=0.672,

Epoch 11, global step 2711: val_loss was not in top 2


Epoch 12:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.555, v_num=3, train_loss=0.407, train_accuracy=0.833, val_loss=0.603, val_accuracy=0.705]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 12:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.555, v_num=3, train_loss=0.407, train_accuracy=0.833, val_loss=0.603, val_accuracy=0.705]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.28s/it][A
Epoch 12:  90%|█████████ | 230/255 [02:44<00:17,  1.39it/s, loss=0.555, v_num=3, train_loss=0.407, train_accuracy=0.833, val_loss=0.603, val_accuracy=0.705]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.81it/s][A
Epoch 12:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.555, v_num=3, train_loss=0.407, train_accuracy=0.833, val_loss=0.603, val_accuracy=0.705]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.90it/s][A
Epoch 12:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.555, v_num=3, train_loss=0.407,

Epoch 12, global step 2937: val_loss reached 0.57661 (best 0.55083), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28-v1.ckpt" as top 2


Epoch 13:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.612, v_num=3, train_loss=0.646, train_accuracy=0.556, val_loss=0.577, val_accuracy=0.687]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 13:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.612, v_num=3, train_loss=0.646, train_accuracy=0.556, val_loss=0.577, val_accuracy=0.687]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.28s/it][A
Epoch 13:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.612, v_num=3, train_loss=0.646, train_accuracy=0.556, val_loss=0.577, val_accuracy=0.687]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.81it/s][A
Epoch 13:  91%|█████████ | 232/255 [02:45<00:16,  1.41it/s, loss=0.612, v_num=3, train_loss=0.646, train_accuracy=0.556, val_loss=0.577, val_accuracy=0.687]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.00it/s][A
Epoch 13:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.612, v_num=3, train_loss=0.646,

Epoch 13, global step 3163: val_loss was not in top 2


Epoch 14:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.481, v_num=3, train_loss=0.613, train_accuracy=0.667, val_loss=0.625, val_accuracy=0.639]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 14:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.481, v_num=3, train_loss=0.613, train_accuracy=0.667, val_loss=0.625, val_accuracy=0.639]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.29s/it][A
Epoch 14:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.481, v_num=3, train_loss=0.613, train_accuracy=0.667, val_loss=0.625, val_accuracy=0.639]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.84it/s][A
Epoch 14:  91%|█████████ | 232/255 [02:45<00:16,  1.41it/s, loss=0.481, v_num=3, train_loss=0.613, train_accuracy=0.667, val_loss=0.625, val_accuracy=0.639]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.99it/s][A
Epoch 14:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.481, v_num=3, train_loss=0.613,

Epoch 14, global step 3389: val_loss reached 0.54238 (best 0.54238), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28-v1.ckpt" as top 2


Epoch 15:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.366, v_num=3, train_loss=0.310, train_accuracy=0.889, val_loss=0.542, val_accuracy=0.722]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 15:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.366, v_num=3, train_loss=0.310, train_accuracy=0.889, val_loss=0.542, val_accuracy=0.722]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.30s/it][A
Epoch 15:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.366, v_num=3, train_loss=0.310, train_accuracy=0.889, val_loss=0.542, val_accuracy=0.722]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.82it/s][A
Epoch 15:  91%|█████████ | 232/255 [02:44<00:16,  1.41it/s, loss=0.366, v_num=3, train_loss=0.310, train_accuracy=0.889, val_loss=0.542, val_accuracy=0.722]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.95it/s][A
Epoch 15:  92%|█████████▏| 234/255 [02:45<00:14,  1.42it/s, loss=0.366, v_num=3, train_loss=0.310,

Epoch 15, global step 3615: val_loss reached 0.46209 (best 0.46209), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28.ckpt" as top 2


Epoch 16:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.389, v_num=3, train_loss=0.260, train_accuracy=0.889, val_loss=0.462, val_accuracy=0.811]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 16:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.389, v_num=3, train_loss=0.260, train_accuracy=0.889, val_loss=0.462, val_accuracy=0.811]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.29s/it][A
Epoch 16:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.389, v_num=3, train_loss=0.260, train_accuracy=0.889, val_loss=0.462, val_accuracy=0.811]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.81it/s][A
Epoch 16:  91%|█████████ | 232/255 [02:44<00:16,  1.41it/s, loss=0.389, v_num=3, train_loss=0.260, train_accuracy=0.889, val_loss=0.462, val_accuracy=0.811]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.96it/s][A
Epoch 16:  92%|█████████▏| 234/255 [02:45<00:14,  1.42it/s, loss=0.389, v_num=3, train_loss=0.260,

Epoch 16, global step 3841: val_loss reached 0.51003 (best 0.46209), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28-v1.ckpt" as top 2


Epoch 17:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.44, v_num=3, train_loss=0.459, train_accuracy=0.833, val_loss=0.510, val_accuracy=0.796] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 17:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.44, v_num=3, train_loss=0.459, train_accuracy=0.833, val_loss=0.510, val_accuracy=0.796]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.27s/it][A
Epoch 17:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.44, v_num=3, train_loss=0.459, train_accuracy=0.833, val_loss=0.510, val_accuracy=0.796]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.83it/s][A
Epoch 17:  91%|█████████ | 232/255 [02:45<00:16,  1.41it/s, loss=0.44, v_num=3, train_loss=0.459, train_accuracy=0.833, val_loss=0.510, val_accuracy=0.796]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.90it/s][A
Epoch 17:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.44, v_num=3, train_loss=0.459, tra

Epoch 17, global step 4067: val_loss reached 0.38770 (best 0.38770), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28-v1.ckpt" as top 2


Epoch 18:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.416, v_num=3, train_loss=0.444, train_accuracy=0.778, val_loss=0.388, val_accuracy=0.836]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 18:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.416, v_num=3, train_loss=0.444, train_accuracy=0.778, val_loss=0.388, val_accuracy=0.836]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.30s/it][A
Epoch 18:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.416, v_num=3, train_loss=0.444, train_accuracy=0.778, val_loss=0.388, val_accuracy=0.836]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.81it/s][A
Epoch 18:  91%|█████████ | 232/255 [02:45<00:16,  1.41it/s, loss=0.416, v_num=3, train_loss=0.444, train_accuracy=0.778, val_loss=0.388, val_accuracy=0.836]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.88it/s][A
Epoch 18:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.416, v_num=3, train_loss=0.444,

Epoch 18, global step 4293: val_loss reached 0.44782 (best 0.38770), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28.ckpt" as top 2


Epoch 19:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.366, v_num=3, train_loss=0.365, train_accuracy=0.722, val_loss=0.448, val_accuracy=0.801]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 19:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.366, v_num=3, train_loss=0.365, train_accuracy=0.722, val_loss=0.448, val_accuracy=0.801]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.33s/it][A
Epoch 19:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.366, v_num=3, train_loss=0.365, train_accuracy=0.722, val_loss=0.448, val_accuracy=0.801]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.79it/s][A
Epoch 19:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.366, v_num=3, train_loss=0.365, train_accuracy=0.722, val_loss=0.448, val_accuracy=0.801]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.95it/s][A
Epoch 19:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.366, v_num=3, train_loss=0.365,

Epoch 19, global step 4519: val_loss reached 0.42852 (best 0.38770), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28.ckpt" as top 2


Epoch 20:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.361, v_num=3, train_loss=0.368, train_accuracy=0.833, val_loss=0.429, val_accuracy=0.820]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 20:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.361, v_num=3, train_loss=0.368, train_accuracy=0.833, val_loss=0.429, val_accuracy=0.820]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.27s/it][A
Epoch 20:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.361, v_num=3, train_loss=0.368, train_accuracy=0.833, val_loss=0.429, val_accuracy=0.820]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.86it/s][A
Epoch 20:  91%|█████████ | 232/255 [02:44<00:16,  1.41it/s, loss=0.361, v_num=3, train_loss=0.368, train_accuracy=0.833, val_loss=0.429, val_accuracy=0.820]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.03it/s][A
Epoch 20:  92%|█████████▏| 234/255 [02:45<00:14,  1.42it/s, loss=0.361, v_num=3, train_loss=0.368,

Epoch 20, global step 4745: val_loss reached 0.41306 (best 0.38770), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28.ckpt" as top 2


Epoch 21:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.453, v_num=3, train_loss=0.330, train_accuracy=0.778, val_loss=0.413, val_accuracy=0.828]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 21:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.453, v_num=3, train_loss=0.330, train_accuracy=0.778, val_loss=0.413, val_accuracy=0.828]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.30s/it][A
Epoch 21:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.453, v_num=3, train_loss=0.330, train_accuracy=0.778, val_loss=0.413, val_accuracy=0.828]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.83it/s][A
Epoch 21:  91%|█████████ | 232/255 [02:45<00:16,  1.41it/s, loss=0.453, v_num=3, train_loss=0.330, train_accuracy=0.778, val_loss=0.413, val_accuracy=0.828]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.94it/s][A
Epoch 21:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.453, v_num=3, train_loss=0.330,

Epoch 21, global step 4971: val_loss was not in top 2


Epoch 22:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.354, v_num=3, train_loss=0.191, train_accuracy=0.944, val_loss=0.426, val_accuracy=0.811]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 22:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.354, v_num=3, train_loss=0.191, train_accuracy=0.944, val_loss=0.426, val_accuracy=0.811]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.28s/it][A
Epoch 22:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.354, v_num=3, train_loss=0.191, train_accuracy=0.944, val_loss=0.426, val_accuracy=0.811]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.82it/s][A
Epoch 22:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.354, v_num=3, train_loss=0.191, train_accuracy=0.944, val_loss=0.426, val_accuracy=0.811]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.99it/s][A
Epoch 22:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.354, v_num=3, train_loss=0.191,

Epoch 22, global step 5197: val_loss was not in top 2


Epoch 23:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.347, v_num=3, train_loss=0.292, train_accuracy=0.889, val_loss=0.434, val_accuracy=0.806]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 23:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.347, v_num=3, train_loss=0.292, train_accuracy=0.889, val_loss=0.434, val_accuracy=0.806]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.28s/it][A
Epoch 23:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.347, v_num=3, train_loss=0.292, train_accuracy=0.889, val_loss=0.434, val_accuracy=0.806]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.80it/s][A
Epoch 23:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.347, v_num=3, train_loss=0.292, train_accuracy=0.889, val_loss=0.434, val_accuracy=0.806]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.95it/s][A
Epoch 23:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.347, v_num=3, train_loss=0.292,

Epoch 23, global step 5423: val_loss was not in top 2


Epoch 24:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.353, v_num=3, train_loss=0.128, train_accuracy=1.000, val_loss=0.464, val_accuracy=0.793]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 24:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.353, v_num=3, train_loss=0.128, train_accuracy=1.000, val_loss=0.464, val_accuracy=0.793]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.32s/it][A
Epoch 24:  90%|█████████ | 230/255 [02:44<00:17,  1.39it/s, loss=0.353, v_num=3, train_loss=0.128, train_accuracy=1.000, val_loss=0.464, val_accuracy=0.793]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.78it/s][A
Epoch 24:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.353, v_num=3, train_loss=0.128, train_accuracy=1.000, val_loss=0.464, val_accuracy=0.793]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.89it/s][A
Epoch 24:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.353, v_num=3, train_loss=0.128,

Epoch 24, global step 5649: val_loss was not in top 2


Epoch 25:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.322, v_num=3, train_loss=0.190, train_accuracy=1.000, val_loss=0.440, val_accuracy=0.820]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 25:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.322, v_num=3, train_loss=0.190, train_accuracy=1.000, val_loss=0.440, val_accuracy=0.820]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.36s/it][A
Epoch 25:  90%|█████████ | 230/255 [02:44<00:17,  1.39it/s, loss=0.322, v_num=3, train_loss=0.190, train_accuracy=1.000, val_loss=0.440, val_accuracy=0.820]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.74it/s][A
Epoch 25:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.322, v_num=3, train_loss=0.190, train_accuracy=1.000, val_loss=0.440, val_accuracy=0.820]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.84it/s][A
Epoch 25:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.322, v_num=3, train_loss=0.190,

Epoch 25, global step 5875: val_loss reached 0.35743 (best 0.35743), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28.ckpt" as top 2


Epoch 26:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.292, v_num=3, train_loss=0.336, train_accuracy=0.833, val_loss=0.357, val_accuracy=0.850]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 26:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.292, v_num=3, train_loss=0.336, train_accuracy=0.833, val_loss=0.357, val_accuracy=0.850]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.29s/it][A
Epoch 26:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.292, v_num=3, train_loss=0.336, train_accuracy=0.833, val_loss=0.357, val_accuracy=0.850]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.82it/s][A
Epoch 26:  91%|█████████ | 232/255 [02:45<00:16,  1.41it/s, loss=0.292, v_num=3, train_loss=0.336, train_accuracy=0.833, val_loss=0.357, val_accuracy=0.850]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.93it/s][A
Epoch 26:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.292, v_num=3, train_loss=0.336,

Epoch 26, global step 6101: val_loss was not in top 2


Epoch 27:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.313, v_num=3, train_loss=0.396, train_accuracy=0.778, val_loss=0.390, val_accuracy=0.850]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 27:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.313, v_num=3, train_loss=0.396, train_accuracy=0.778, val_loss=0.390, val_accuracy=0.850]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.28s/it][A
Epoch 27:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.313, v_num=3, train_loss=0.396, train_accuracy=0.778, val_loss=0.390, val_accuracy=0.850]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.84it/s][A
Epoch 27:  91%|█████████ | 232/255 [02:45<00:16,  1.41it/s, loss=0.313, v_num=3, train_loss=0.396, train_accuracy=0.778, val_loss=0.390, val_accuracy=0.850]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.98it/s][A
Epoch 27:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.313, v_num=3, train_loss=0.396,

Epoch 27, global step 6327: val_loss reached 0.38120 (best 0.35743), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28-v1.ckpt" as top 2


Epoch 28:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.324, v_num=3, train_loss=0.297, train_accuracy=0.833, val_loss=0.381, val_accuracy=0.834]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 28:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.324, v_num=3, train_loss=0.297, train_accuracy=0.833, val_loss=0.381, val_accuracy=0.834]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.28s/it][A
Epoch 28:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.324, v_num=3, train_loss=0.297, train_accuracy=0.833, val_loss=0.381, val_accuracy=0.834]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.84it/s][A
Epoch 28:  91%|█████████ | 232/255 [02:44<00:16,  1.41it/s, loss=0.324, v_num=3, train_loss=0.297, train_accuracy=0.833, val_loss=0.381, val_accuracy=0.834]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.01it/s][A
Epoch 28:  92%|█████████▏| 234/255 [02:45<00:14,  1.42it/s, loss=0.324, v_num=3, train_loss=0.297,

Epoch 28, global step 6553: val_loss reached 0.35625 (best 0.35625), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28-v1.ckpt" as top 2


Epoch 29:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.452, v_num=3, train_loss=0.294, train_accuracy=0.833, val_loss=0.356, val_accuracy=0.857]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 29:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.452, v_num=3, train_loss=0.294, train_accuracy=0.833, val_loss=0.356, val_accuracy=0.857]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.28s/it][A
Epoch 29:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.452, v_num=3, train_loss=0.294, train_accuracy=0.833, val_loss=0.356, val_accuracy=0.857]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.80it/s][A
Epoch 29:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.452, v_num=3, train_loss=0.294, train_accuracy=0.833, val_loss=0.356, val_accuracy=0.857]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.97it/s][A
Epoch 29:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.452, v_num=3, train_loss=0.294,

Epoch 29, global step 6779: val_loss was not in top 2


Epoch 30:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.321, v_num=3, train_loss=0.145, train_accuracy=0.944, val_loss=0.393, val_accuracy=0.824]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 30:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.321, v_num=3, train_loss=0.145, train_accuracy=0.944, val_loss=0.393, val_accuracy=0.824]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.29s/it][A
Epoch 30:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.321, v_num=3, train_loss=0.145, train_accuracy=0.944, val_loss=0.393, val_accuracy=0.824]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.79it/s][A
Epoch 30:  91%|█████████ | 232/255 [02:45<00:16,  1.41it/s, loss=0.321, v_num=3, train_loss=0.145, train_accuracy=0.944, val_loss=0.393, val_accuracy=0.824]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.93it/s][A
Epoch 30:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.321, v_num=3, train_loss=0.145,

Epoch 30, global step 7005: val_loss was not in top 2


Epoch 31:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.289, v_num=3, train_loss=0.194, train_accuracy=0.944, val_loss=0.375, val_accuracy=0.851]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 31:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.289, v_num=3, train_loss=0.194, train_accuracy=0.944, val_loss=0.375, val_accuracy=0.851]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.30s/it][A
Epoch 31:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.289, v_num=3, train_loss=0.194, train_accuracy=0.944, val_loss=0.375, val_accuracy=0.851]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.82it/s][A
Epoch 31:  91%|█████████ | 232/255 [02:44<00:16,  1.41it/s, loss=0.289, v_num=3, train_loss=0.194, train_accuracy=0.944, val_loss=0.375, val_accuracy=0.851]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.95it/s][A
Epoch 31:  92%|█████████▏| 234/255 [02:45<00:14,  1.42it/s, loss=0.289, v_num=3, train_loss=0.194,

Epoch 31, global step 7231: val_loss reached 0.35673 (best 0.35625), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28.ckpt" as top 2


Epoch 32:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.28, v_num=3, train_loss=0.257, train_accuracy=0.889, val_loss=0.357, val_accuracy=0.844] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 32:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.28, v_num=3, train_loss=0.257, train_accuracy=0.889, val_loss=0.357, val_accuracy=0.844]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.28s/it][A
Epoch 32:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.28, v_num=3, train_loss=0.257, train_accuracy=0.889, val_loss=0.357, val_accuracy=0.844]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.83it/s][A
Epoch 32:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.28, v_num=3, train_loss=0.257, train_accuracy=0.889, val_loss=0.357, val_accuracy=0.844]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.93it/s][A
Epoch 32:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.28, v_num=3, train_loss=0.257, tra

Epoch 32, global step 7457: val_loss reached 0.33591 (best 0.33591), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28.ckpt" as top 2


Epoch 33:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.374, v_num=3, train_loss=0.409, train_accuracy=0.778, val_loss=0.336, val_accuracy=0.847]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 33:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.374, v_num=3, train_loss=0.409, train_accuracy=0.778, val_loss=0.336, val_accuracy=0.847]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.29s/it][A
Epoch 33:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.374, v_num=3, train_loss=0.409, train_accuracy=0.778, val_loss=0.336, val_accuracy=0.847]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.83it/s][A
Epoch 33:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.374, v_num=3, train_loss=0.409, train_accuracy=0.778, val_loss=0.336, val_accuracy=0.847]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.99it/s][A
Epoch 33:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.374, v_num=3, train_loss=0.409,

Epoch 33, global step 7683: val_loss was not in top 2


Epoch 34:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.297, v_num=3, train_loss=0.301, train_accuracy=0.889, val_loss=0.381, val_accuracy=0.848]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 34:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.297, v_num=3, train_loss=0.301, train_accuracy=0.889, val_loss=0.381, val_accuracy=0.848]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.30s/it][A
Epoch 34:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.297, v_num=3, train_loss=0.301, train_accuracy=0.889, val_loss=0.381, val_accuracy=0.848]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.81it/s][A
Epoch 34:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.297, v_num=3, train_loss=0.301, train_accuracy=0.889, val_loss=0.381, val_accuracy=0.848]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.96it/s][A
Epoch 34:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.297, v_num=3, train_loss=0.301,

Epoch 34, global step 7909: val_loss was not in top 2


Epoch 35:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.321, v_num=3, train_loss=0.511, train_accuracy=0.667, val_loss=0.379, val_accuracy=0.859]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 35:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.321, v_num=3, train_loss=0.511, train_accuracy=0.667, val_loss=0.379, val_accuracy=0.859]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.30s/it][A
Epoch 35:  90%|█████████ | 230/255 [02:44<00:17,  1.39it/s, loss=0.321, v_num=3, train_loss=0.511, train_accuracy=0.667, val_loss=0.379, val_accuracy=0.859]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.82it/s][A
Epoch 35:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.321, v_num=3, train_loss=0.511, train_accuracy=0.667, val_loss=0.379, val_accuracy=0.859]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.88it/s][A
Epoch 35:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.321, v_num=3, train_loss=0.511,

Epoch 35, global step 8135: val_loss reached 0.32210 (best 0.32210), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28-v1.ckpt" as top 2


Epoch 36:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.274, v_num=3, train_loss=0.343, train_accuracy=0.833, val_loss=0.322, val_accuracy=0.869]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 36:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.274, v_num=3, train_loss=0.343, train_accuracy=0.833, val_loss=0.322, val_accuracy=0.869]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.28s/it][A
Epoch 36:  90%|█████████ | 230/255 [02:44<00:17,  1.39it/s, loss=0.274, v_num=3, train_loss=0.343, train_accuracy=0.833, val_loss=0.322, val_accuracy=0.869]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.82it/s][A
Epoch 36:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.274, v_num=3, train_loss=0.343, train_accuracy=0.833, val_loss=0.322, val_accuracy=0.869]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.90it/s][A
Epoch 36:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.274, v_num=3, train_loss=0.343,

Epoch 36, global step 8361: val_loss was not in top 2


Epoch 37:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.271, v_num=3, train_loss=0.274, train_accuracy=0.889, val_loss=0.336, val_accuracy=0.872]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 37:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.271, v_num=3, train_loss=0.274, train_accuracy=0.889, val_loss=0.336, val_accuracy=0.872]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.29s/it][A
Epoch 37:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.271, v_num=3, train_loss=0.274, train_accuracy=0.889, val_loss=0.336, val_accuracy=0.872]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.83it/s][A
Epoch 37:  91%|█████████ | 232/255 [02:44<00:16,  1.41it/s, loss=0.271, v_num=3, train_loss=0.274, train_accuracy=0.889, val_loss=0.336, val_accuracy=0.872]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.99it/s][A
Epoch 37:  92%|█████████▏| 234/255 [02:45<00:14,  1.42it/s, loss=0.271, v_num=3, train_loss=0.274,

Epoch 37, global step 8587: val_loss was not in top 2


Epoch 38:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.243, v_num=3, train_loss=0.242, train_accuracy=0.889, val_loss=0.336, val_accuracy=0.855]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 38:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.243, v_num=3, train_loss=0.242, train_accuracy=0.889, val_loss=0.336, val_accuracy=0.855]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.30s/it][A
Epoch 38:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.243, v_num=3, train_loss=0.242, train_accuracy=0.889, val_loss=0.336, val_accuracy=0.855]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.80it/s][A
Epoch 38:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.243, v_num=3, train_loss=0.242, train_accuracy=0.889, val_loss=0.336, val_accuracy=0.855]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.90it/s][A
Epoch 38:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.243, v_num=3, train_loss=0.242,

Epoch 38, global step 8813: val_loss reached 0.30740 (best 0.30740), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28.ckpt" as top 2


Epoch 39:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.287, v_num=3, train_loss=0.152, train_accuracy=0.944, val_loss=0.307, val_accuracy=0.857]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 39:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.287, v_num=3, train_loss=0.152, train_accuracy=0.944, val_loss=0.307, val_accuracy=0.857]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.32s/it][A
Epoch 39:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.287, v_num=3, train_loss=0.152, train_accuracy=0.944, val_loss=0.307, val_accuracy=0.857]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.78it/s][A
Epoch 39:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.287, v_num=3, train_loss=0.152, train_accuracy=0.944, val_loss=0.307, val_accuracy=0.857]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.94it/s][A
Epoch 39:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.287, v_num=3, train_loss=0.152,

Epoch 39, global step 9039: val_loss was not in top 2


Epoch 40:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.231, v_num=3, train_loss=0.309, train_accuracy=0.944, val_loss=0.349, val_accuracy=0.849]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 40:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.231, v_num=3, train_loss=0.309, train_accuracy=0.944, val_loss=0.349, val_accuracy=0.849]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 40:  90%|█████████ | 230/255 [02:44<00:17,  1.39it/s, loss=0.231, v_num=3, train_loss=0.309, train_accuracy=0.944, val_loss=0.349, val_accuracy=0.849]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.79it/s][A
Epoch 40:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.231, v_num=3, train_loss=0.309, train_accuracy=0.944, val_loss=0.349, val_accuracy=0.849]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.93it/s][A
Epoch 40:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.231, v_num=3, train_loss=0.309,

Epoch 40, global step 9265: val_loss reached 0.30991 (best 0.30740), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28-v1.ckpt" as top 2


Epoch 41:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.234, v_num=3, train_loss=0.296, train_accuracy=0.889, val_loss=0.310, val_accuracy=0.872]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 41:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.234, v_num=3, train_loss=0.296, train_accuracy=0.889, val_loss=0.310, val_accuracy=0.872]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.32s/it][A
Epoch 41:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.234, v_num=3, train_loss=0.296, train_accuracy=0.889, val_loss=0.310, val_accuracy=0.872]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.79it/s][A
Epoch 41:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.234, v_num=3, train_loss=0.296, train_accuracy=0.889, val_loss=0.310, val_accuracy=0.872]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.94it/s][A
Epoch 41:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.234, v_num=3, train_loss=0.296,

Epoch 41, global step 9491: val_loss reached 0.30323 (best 0.30323), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28-v1.ckpt" as top 2


Epoch 42:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.256, v_num=3, train_loss=0.187, train_accuracy=0.944, val_loss=0.303, val_accuracy=0.881] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 42:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.256, v_num=3, train_loss=0.187, train_accuracy=0.944, val_loss=0.303, val_accuracy=0.881]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 42:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.256, v_num=3, train_loss=0.187, train_accuracy=0.944, val_loss=0.303, val_accuracy=0.881]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.78it/s][A
Epoch 42:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.256, v_num=3, train_loss=0.187, train_accuracy=0.944, val_loss=0.303, val_accuracy=0.881]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.97it/s][A
Epoch 42:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.256, v_num=3, train_loss=0.187

Epoch 42, global step 9717: val_loss was not in top 2


Epoch 43:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.219, v_num=3, train_loss=0.0883, train_accuracy=1.000, val_loss=0.308, val_accuracy=0.873]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 43:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.219, v_num=3, train_loss=0.0883, train_accuracy=1.000, val_loss=0.308, val_accuracy=0.873]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.30s/it][A
Epoch 43:  90%|█████████ | 230/255 [02:44<00:17,  1.39it/s, loss=0.219, v_num=3, train_loss=0.0883, train_accuracy=1.000, val_loss=0.308, val_accuracy=0.873]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.81it/s][A
Epoch 43:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.219, v_num=3, train_loss=0.0883, train_accuracy=1.000, val_loss=0.308, val_accuracy=0.873]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.96it/s][A
Epoch 43:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.219, v_num=3, train_loss=0.

Epoch 43, global step 9943: val_loss reached 0.28838 (best 0.28838), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28.ckpt" as top 2


Epoch 44:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.236, v_num=3, train_loss=0.202, train_accuracy=0.944, val_loss=0.288, val_accuracy=0.881] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 44:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.236, v_num=3, train_loss=0.202, train_accuracy=0.944, val_loss=0.288, val_accuracy=0.881]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.32s/it][A
Epoch 44:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.236, v_num=3, train_loss=0.202, train_accuracy=0.944, val_loss=0.288, val_accuracy=0.881]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.79it/s][A
Epoch 44:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.236, v_num=3, train_loss=0.202, train_accuracy=0.944, val_loss=0.288, val_accuracy=0.881]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.97it/s][A
Epoch 44:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.236, v_num=3, train_loss=0.202

Epoch 44, global step 10169: val_loss reached 0.29666 (best 0.28838), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28-v1.ckpt" as top 2


Epoch 45:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.232, v_num=3, train_loss=0.107, train_accuracy=0.944, val_loss=0.297, val_accuracy=0.876] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 45:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.232, v_num=3, train_loss=0.107, train_accuracy=0.944, val_loss=0.297, val_accuracy=0.876]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.31s/it][A
Epoch 45:  90%|█████████ | 230/255 [02:44<00:17,  1.39it/s, loss=0.232, v_num=3, train_loss=0.107, train_accuracy=0.944, val_loss=0.297, val_accuracy=0.876]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.81it/s][A
Epoch 45:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.232, v_num=3, train_loss=0.107, train_accuracy=0.944, val_loss=0.297, val_accuracy=0.876]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.92it/s][A
Epoch 45:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.232, v_num=3, train_loss=0.107

Epoch 45, global step 10395: val_loss reached 0.29650 (best 0.28838), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28-v1.ckpt" as top 2


Epoch 46:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.223, v_num=3, train_loss=0.396, train_accuracy=0.778, val_loss=0.297, val_accuracy=0.885] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 46:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.223, v_num=3, train_loss=0.396, train_accuracy=0.778, val_loss=0.297, val_accuracy=0.885]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.31s/it][A
Epoch 46:  90%|█████████ | 230/255 [02:44<00:17,  1.39it/s, loss=0.223, v_num=3, train_loss=0.396, train_accuracy=0.778, val_loss=0.297, val_accuracy=0.885]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.81it/s][A
Epoch 46:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.223, v_num=3, train_loss=0.396, train_accuracy=0.778, val_loss=0.297, val_accuracy=0.885]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.99it/s][A
Epoch 46:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.223, v_num=3, train_loss=0.396

Epoch 46, global step 10621: val_loss was not in top 2


Epoch 47:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.211, v_num=3, train_loss=0.272, train_accuracy=0.778, val_loss=0.369, val_accuracy=0.832]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 47:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.211, v_num=3, train_loss=0.272, train_accuracy=0.778, val_loss=0.369, val_accuracy=0.832]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.28s/it][A
Epoch 47:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.211, v_num=3, train_loss=0.272, train_accuracy=0.778, val_loss=0.369, val_accuracy=0.832]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.81it/s][A
Epoch 47:  91%|█████████ | 232/255 [02:44<00:16,  1.41it/s, loss=0.211, v_num=3, train_loss=0.272, train_accuracy=0.778, val_loss=0.369, val_accuracy=0.832]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.93it/s][A
Epoch 47:  92%|█████████▏| 234/255 [02:45<00:14,  1.42it/s, loss=0.211, v_num=3, train_loss=0.272,

Epoch 47, global step 10847: val_loss reached 0.27338 (best 0.27338), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28-v1.ckpt" as top 2


Epoch 48:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.226, v_num=3, train_loss=0.173, train_accuracy=0.944, val_loss=0.273, val_accuracy=0.877] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 48:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.226, v_num=3, train_loss=0.173, train_accuracy=0.944, val_loss=0.273, val_accuracy=0.877]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.32s/it][A
Epoch 48:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.226, v_num=3, train_loss=0.173, train_accuracy=0.944, val_loss=0.273, val_accuracy=0.877]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.79it/s][A
Epoch 48:  91%|█████████ | 232/255 [02:44<00:16,  1.41it/s, loss=0.226, v_num=3, train_loss=0.173, train_accuracy=0.944, val_loss=0.273, val_accuracy=0.877]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.89it/s][A
Epoch 48:  92%|█████████▏| 234/255 [02:45<00:14,  1.42it/s, loss=0.226, v_num=3, train_loss=0.173

Epoch 48, global step 11073: val_loss was not in top 2


Epoch 49:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.24, v_num=3, train_loss=0.095, train_accuracy=1.000, val_loss=0.345, val_accuracy=0.861]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 49:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.24, v_num=3, train_loss=0.095, train_accuracy=1.000, val_loss=0.345, val_accuracy=0.861]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.29s/it][A
Epoch 49:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.24, v_num=3, train_loss=0.095, train_accuracy=1.000, val_loss=0.345, val_accuracy=0.861]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.78it/s][A
Epoch 49:  91%|█████████ | 232/255 [02:45<00:16,  1.41it/s, loss=0.24, v_num=3, train_loss=0.095, train_accuracy=1.000, val_loss=0.345, val_accuracy=0.861]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.89it/s][A
Epoch 49:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.24, v_num=3, train_loss=0.095, tr

Epoch 49, global step 11299: val_loss was not in top 2


Epoch 50:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.21, v_num=3, train_loss=0.294, train_accuracy=0.833, val_loss=0.292, val_accuracy=0.862]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 50:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.21, v_num=3, train_loss=0.294, train_accuracy=0.833, val_loss=0.292, val_accuracy=0.862]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.29s/it][A
Epoch 50:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.21, v_num=3, train_loss=0.294, train_accuracy=0.833, val_loss=0.292, val_accuracy=0.862]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.83it/s][A
Epoch 50:  91%|█████████ | 232/255 [02:44<00:16,  1.41it/s, loss=0.21, v_num=3, train_loss=0.294, train_accuracy=0.833, val_loss=0.292, val_accuracy=0.862]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.92it/s][A
Epoch 50:  92%|█████████▏| 234/255 [02:45<00:14,  1.42it/s, loss=0.21, v_num=3, train_loss=0.294, tr

Epoch 50, global step 11525: val_loss was not in top 2


Epoch 51:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.484, v_num=3, train_loss=0.867, train_accuracy=0.667, val_loss=0.314, val_accuracy=0.862] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 51:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.484, v_num=3, train_loss=0.867, train_accuracy=0.667, val_loss=0.314, val_accuracy=0.862]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.30s/it][A
Epoch 51:  90%|█████████ | 230/255 [02:44<00:17,  1.39it/s, loss=0.484, v_num=3, train_loss=0.867, train_accuracy=0.667, val_loss=0.314, val_accuracy=0.862]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.81it/s][A
Epoch 51:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.484, v_num=3, train_loss=0.867, train_accuracy=0.667, val_loss=0.314, val_accuracy=0.862]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.95it/s][A
Epoch 51:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.484, v_num=3, train_loss=0.867

Epoch 51, global step 11751: val_loss was not in top 2


Epoch 52:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.277, v_num=3, train_loss=0.180, train_accuracy=0.944, val_loss=0.399, val_accuracy=0.808]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 52:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.277, v_num=3, train_loss=0.180, train_accuracy=0.944, val_loss=0.399, val_accuracy=0.808]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.31s/it][A
Epoch 52:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.277, v_num=3, train_loss=0.180, train_accuracy=0.944, val_loss=0.399, val_accuracy=0.808]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.77it/s][A
Epoch 52:  91%|█████████ | 232/255 [02:45<00:16,  1.41it/s, loss=0.277, v_num=3, train_loss=0.180, train_accuracy=0.944, val_loss=0.399, val_accuracy=0.808]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.94it/s][A
Epoch 52:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.277, v_num=3, train_loss=0.180,

Epoch 52, global step 11977: val_loss reached 0.27072 (best 0.27072), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28.ckpt" as top 2


Epoch 53:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.24, v_num=3, train_loss=0.277, train_accuracy=0.944, val_loss=0.271, val_accuracy=0.862] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 53:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.24, v_num=3, train_loss=0.277, train_accuracy=0.944, val_loss=0.271, val_accuracy=0.862]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.29s/it][A
Epoch 53:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.24, v_num=3, train_loss=0.277, train_accuracy=0.944, val_loss=0.271, val_accuracy=0.862]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.82it/s][A
Epoch 53:  91%|█████████ | 232/255 [02:44<00:16,  1.41it/s, loss=0.24, v_num=3, train_loss=0.277, train_accuracy=0.944, val_loss=0.271, val_accuracy=0.862]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.91it/s][A
Epoch 53:  92%|█████████▏| 234/255 [02:45<00:14,  1.42it/s, loss=0.24, v_num=3, train_loss=0.277, tra

Epoch 53, global step 12203: val_loss reached 0.26690 (best 0.26690), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28-v1.ckpt" as top 2


Epoch 54:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.302, v_num=3, train_loss=0.404, train_accuracy=0.889, val_loss=0.267, val_accuracy=0.878] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 54:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.302, v_num=3, train_loss=0.404, train_accuracy=0.889, val_loss=0.267, val_accuracy=0.878]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.30s/it][A
Epoch 54:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.302, v_num=3, train_loss=0.404, train_accuracy=0.889, val_loss=0.267, val_accuracy=0.878]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.78it/s][A
Epoch 54:  91%|█████████ | 232/255 [02:44<00:16,  1.41it/s, loss=0.302, v_num=3, train_loss=0.404, train_accuracy=0.889, val_loss=0.267, val_accuracy=0.878]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.95it/s][A
Epoch 54:  92%|█████████▏| 234/255 [02:45<00:14,  1.42it/s, loss=0.302, v_num=3, train_loss=0.404

Epoch 54, global step 12429: val_loss was not in top 2


Epoch 55:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.202, v_num=3, train_loss=0.201, train_accuracy=0.944, val_loss=0.431, val_accuracy=0.832] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 55:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.202, v_num=3, train_loss=0.201, train_accuracy=0.944, val_loss=0.431, val_accuracy=0.832]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.29s/it][A
Epoch 55:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.202, v_num=3, train_loss=0.201, train_accuracy=0.944, val_loss=0.431, val_accuracy=0.832]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.83it/s][A
Epoch 55:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.202, v_num=3, train_loss=0.201, train_accuracy=0.944, val_loss=0.431, val_accuracy=0.832]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.92it/s][A
Epoch 55:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.202, v_num=3, train_loss=0.201

Epoch 55, global step 12655: val_loss reached 0.26775 (best 0.26690), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28.ckpt" as top 2


Epoch 56:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.224, v_num=3, train_loss=0.201, train_accuracy=0.889, val_loss=0.268, val_accuracy=0.879] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 56:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.224, v_num=3, train_loss=0.201, train_accuracy=0.889, val_loss=0.268, val_accuracy=0.879]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.30s/it][A
Epoch 56:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.224, v_num=3, train_loss=0.201, train_accuracy=0.889, val_loss=0.268, val_accuracy=0.879]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.80it/s][A
Epoch 56:  91%|█████████ | 232/255 [02:44<00:16,  1.41it/s, loss=0.224, v_num=3, train_loss=0.201, train_accuracy=0.889, val_loss=0.268, val_accuracy=0.879]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.96it/s][A
Epoch 56:  92%|█████████▏| 234/255 [02:45<00:14,  1.42it/s, loss=0.224, v_num=3, train_loss=0.201

Epoch 56, global step 12881: val_loss reached 0.23100 (best 0.23100), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28.ckpt" as top 2


Epoch 57:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.197, v_num=3, train_loss=0.117, train_accuracy=0.944, val_loss=0.231, val_accuracy=0.894] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 57:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.197, v_num=3, train_loss=0.117, train_accuracy=0.944, val_loss=0.231, val_accuracy=0.894]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.30s/it][A
Epoch 57:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.197, v_num=3, train_loss=0.117, train_accuracy=0.944, val_loss=0.231, val_accuracy=0.894]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.79it/s][A
Epoch 57:  91%|█████████ | 232/255 [02:45<00:16,  1.41it/s, loss=0.197, v_num=3, train_loss=0.117, train_accuracy=0.944, val_loss=0.231, val_accuracy=0.894]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.95it/s][A
Epoch 57:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.197, v_num=3, train_loss=0.117

Epoch 57, global step 13107: val_loss reached 0.24278 (best 0.23100), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28-v1.ckpt" as top 2


Epoch 58:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.186, v_num=3, train_loss=0.232, train_accuracy=0.833, val_loss=0.243, val_accuracy=0.889] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 58:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.186, v_num=3, train_loss=0.232, train_accuracy=0.833, val_loss=0.243, val_accuracy=0.889]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.29s/it][A
Epoch 58:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.186, v_num=3, train_loss=0.232, train_accuracy=0.833, val_loss=0.243, val_accuracy=0.889]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.81it/s][A
Epoch 58:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.186, v_num=3, train_loss=0.232, train_accuracy=0.833, val_loss=0.243, val_accuracy=0.889]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.95it/s][A
Epoch 58:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.186, v_num=3, train_loss=0.232

Epoch 58, global step 13333: val_loss was not in top 2


Epoch 59:  19%|█▉        | 48/255 [00:36<02:37,  1.31it/s, loss=0.228, v_num=3, train_loss=0.218, train_accuracy=0.900, val_loss=0.282, val_accuracy=0.888] 

IOPub message rate exceeded.
The notebook server will temporarily stop sending output
to the client in order to avoid crashing it.
To change this limit, set the config variable
`--NotebookApp.iopub_msg_rate_limit`.

Current values:
NotebookApp.iopub_msg_rate_limit=1000.0 (msgs/sec)
NotebookApp.rate_limit_window=3.0 (secs)



Epoch 62:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.226, v_num=3, train_loss=0.127, train_accuracy=1.000, val_loss=0.503, val_accuracy=0.787]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 62:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.226, v_num=3, train_loss=0.127, train_accuracy=1.000, val_loss=0.503, val_accuracy=0.787]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.31s/it][A
Epoch 62:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.226, v_num=3, train_loss=0.127, train_accuracy=1.000, val_loss=0.503, val_accuracy=0.787]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.79it/s][A
Epoch 62:  91%|█████████ | 232/255 [02:45<00:16,  1.41it/s, loss=0.226, v_num=3, train_loss=0.127, train_accuracy=1.000, val_loss=0.503, val_accuracy=0.787]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.86it/s][A
Epoch 62:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.226, v_num=3, train_loss=0.127,

Epoch 62, global step 14237: val_loss was not in top 2


Epoch 63:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.217, v_num=3, train_loss=0.274, train_accuracy=0.778, val_loss=0.278, val_accuracy=0.868] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 63:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.217, v_num=3, train_loss=0.274, train_accuracy=0.778, val_loss=0.278, val_accuracy=0.868]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 63:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.217, v_num=3, train_loss=0.274, train_accuracy=0.778, val_loss=0.278, val_accuracy=0.868]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.77it/s][A
Epoch 63:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.217, v_num=3, train_loss=0.274, train_accuracy=0.778, val_loss=0.278, val_accuracy=0.868]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.80it/s][A
Epoch 63:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.217, v_num=3, train_loss=0.274

Epoch 63, global step 14463: val_loss was not in top 2


Epoch 64:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.257, v_num=3, train_loss=0.236, train_accuracy=0.889, val_loss=0.271, val_accuracy=0.877] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 64:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.257, v_num=3, train_loss=0.236, train_accuracy=0.889, val_loss=0.271, val_accuracy=0.877]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.29s/it][A
Epoch 64:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.257, v_num=3, train_loss=0.236, train_accuracy=0.889, val_loss=0.271, val_accuracy=0.877]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.80it/s][A
Epoch 64:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.257, v_num=3, train_loss=0.236, train_accuracy=0.889, val_loss=0.271, val_accuracy=0.877]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.91it/s][A
Epoch 64:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.257, v_num=3, train_loss=0.236

Epoch 64, global step 14689: val_loss was not in top 2


Epoch 65:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.204, v_num=3, train_loss=0.097, train_accuracy=0.944, val_loss=0.310, val_accuracy=0.875] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 65:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.204, v_num=3, train_loss=0.097, train_accuracy=0.944, val_loss=0.310, val_accuracy=0.875]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.29s/it][A
Epoch 65:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.204, v_num=3, train_loss=0.097, train_accuracy=0.944, val_loss=0.310, val_accuracy=0.875]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.82it/s][A
Epoch 65:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.204, v_num=3, train_loss=0.097, train_accuracy=0.944, val_loss=0.310, val_accuracy=0.875]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.92it/s][A
Epoch 65:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.204, v_num=3, train_loss=0.097

Epoch 65, global step 14915: val_loss was not in top 2


Epoch 66:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.235, v_num=3, train_loss=0.162, train_accuracy=0.944, val_loss=0.308, val_accuracy=0.874]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 66:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.235, v_num=3, train_loss=0.162, train_accuracy=0.944, val_loss=0.308, val_accuracy=0.874]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.31s/it][A
Epoch 66:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.235, v_num=3, train_loss=0.162, train_accuracy=0.944, val_loss=0.308, val_accuracy=0.874]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.81it/s][A
Epoch 66:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.235, v_num=3, train_loss=0.162, train_accuracy=0.944, val_loss=0.308, val_accuracy=0.874]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.90it/s][A
Epoch 66:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.235, v_num=3, train_loss=0.162,

Epoch 66, global step 15141: val_loss was not in top 2


Epoch 67:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.211, v_num=3, train_loss=0.356, train_accuracy=0.833, val_loss=0.295, val_accuracy=0.873]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 67:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.211, v_num=3, train_loss=0.356, train_accuracy=0.833, val_loss=0.295, val_accuracy=0.873]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.29s/it][A
Epoch 67:  90%|█████████ | 230/255 [02:44<00:17,  1.39it/s, loss=0.211, v_num=3, train_loss=0.356, train_accuracy=0.833, val_loss=0.295, val_accuracy=0.873]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.81it/s][A
Epoch 67:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.211, v_num=3, train_loss=0.356, train_accuracy=0.833, val_loss=0.295, val_accuracy=0.873]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.97it/s][A
Epoch 67:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.211, v_num=3, train_loss=0.356,

Epoch 67, global step 15367: val_loss was not in top 2


Epoch 68:  78%|███████▊  | 200/255 [02:23<00:39,  1.40it/s, loss=0.194, v_num=3, train_loss=0.201, train_accuracy=0.920, val_loss=0.278, val_accuracy=0.887] 

IOPub message rate exceeded.
The notebook server will temporarily stop sending output
to the client in order to avoid crashing it.
To change this limit, set the config variable
`--NotebookApp.iopub_msg_rate_limit`.

Current values:
NotebookApp.iopub_msg_rate_limit=1000.0 (msgs/sec)
NotebookApp.rate_limit_window=3.0 (secs)



Epoch 72:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.214, v_num=3, train_loss=0.484, train_accuracy=0.722, val_loss=0.344, val_accuracy=0.877] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 72:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.214, v_num=3, train_loss=0.484, train_accuracy=0.722, val_loss=0.344, val_accuracy=0.877]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.31s/it][A
Epoch 72:  90%|█████████ | 230/255 [02:44<00:17,  1.39it/s, loss=0.214, v_num=3, train_loss=0.484, train_accuracy=0.722, val_loss=0.344, val_accuracy=0.877]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.77it/s][A
Epoch 72:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.214, v_num=3, train_loss=0.484, train_accuracy=0.722, val_loss=0.344, val_accuracy=0.877]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.92it/s][A
Epoch 72:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.214, v_num=3, train_loss=0.484

Epoch 72, global step 16497: val_loss was not in top 2


Epoch 73:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.245, v_num=3, train_loss=0.532, train_accuracy=0.722, val_loss=0.319, val_accuracy=0.879] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 73:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.245, v_num=3, train_loss=0.532, train_accuracy=0.722, val_loss=0.319, val_accuracy=0.879]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.30s/it][A
Epoch 73:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.245, v_num=3, train_loss=0.532, train_accuracy=0.722, val_loss=0.319, val_accuracy=0.879]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.80it/s][A
Epoch 73:  91%|█████████ | 232/255 [02:45<00:16,  1.41it/s, loss=0.245, v_num=3, train_loss=0.532, train_accuracy=0.722, val_loss=0.319, val_accuracy=0.879]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.98it/s][A
Epoch 73:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.245, v_num=3, train_loss=0.532

Epoch 73, global step 16723: val_loss was not in top 2


Epoch 74:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.181, v_num=3, train_loss=0.187, train_accuracy=0.889, val_loss=0.269, val_accuracy=0.895] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 74:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.181, v_num=3, train_loss=0.187, train_accuracy=0.889, val_loss=0.269, val_accuracy=0.895]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.31s/it][A
Epoch 74:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.181, v_num=3, train_loss=0.187, train_accuracy=0.889, val_loss=0.269, val_accuracy=0.895]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.79it/s][A
Epoch 74:  91%|█████████ | 232/255 [02:44<00:16,  1.41it/s, loss=0.181, v_num=3, train_loss=0.187, train_accuracy=0.889, val_loss=0.269, val_accuracy=0.895]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.89it/s][A
Epoch 74:  92%|█████████▏| 234/255 [02:45<00:14,  1.42it/s, loss=0.181, v_num=3, train_loss=0.187

Epoch 74, global step 16949: val_loss was not in top 2


Epoch 75:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.299, v_num=3, train_loss=0.315, train_accuracy=0.833, val_loss=0.245, val_accuracy=0.899] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 75:  89%|████████▉ | 228/255 [02:44<00:19,  1.39it/s, loss=0.299, v_num=3, train_loss=0.315, train_accuracy=0.833, val_loss=0.245, val_accuracy=0.899]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.31s/it][A
Epoch 75:  90%|█████████ | 230/255 [02:44<00:17,  1.40it/s, loss=0.299, v_num=3, train_loss=0.315, train_accuracy=0.833, val_loss=0.245, val_accuracy=0.899]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.80it/s][A
Epoch 75:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.299, v_num=3, train_loss=0.315, train_accuracy=0.833, val_loss=0.245, val_accuracy=0.899]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.88it/s][A
Epoch 75:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.299, v_num=3, train_loss=0.315

Epoch 75, global step 17175: val_loss was not in top 2


Epoch 76:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.166, v_num=3, train_loss=0.0937, train_accuracy=1.000, val_loss=0.294, val_accuracy=0.887]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 76:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.166, v_num=3, train_loss=0.0937, train_accuracy=1.000, val_loss=0.294, val_accuracy=0.887]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.35s/it][A
Epoch 76:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.166, v_num=3, train_loss=0.0937, train_accuracy=1.000, val_loss=0.294, val_accuracy=0.887]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.77it/s][A
Epoch 76:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.166, v_num=3, train_loss=0.0937, train_accuracy=1.000, val_loss=0.294, val_accuracy=0.887]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.95it/s][A
Epoch 76:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.166, v_num=3, train_loss=0.

Epoch 76, global step 17401: val_loss was not in top 2


Epoch 77:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.169, v_num=3, train_loss=0.0872, train_accuracy=0.944, val_loss=0.240, val_accuracy=0.906]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 77:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.169, v_num=3, train_loss=0.0872, train_accuracy=0.944, val_loss=0.240, val_accuracy=0.906]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.31s/it][A
Epoch 77:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.169, v_num=3, train_loss=0.0872, train_accuracy=0.944, val_loss=0.240, val_accuracy=0.906]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.81it/s][A
Epoch 77:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.169, v_num=3, train_loss=0.0872, train_accuracy=0.944, val_loss=0.240, val_accuracy=0.906]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.94it/s][A
Epoch 77:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.169, v_num=3, train_loss=0.

Epoch 77, global step 17627: val_loss was not in top 2


Epoch 78:  85%|████████▍ | 216/255 [02:34<00:27,  1.40it/s, loss=0.169, v_num=3, train_loss=0.0614, train_accuracy=1.000, val_loss=0.292, val_accuracy=0.881]

IOPub message rate exceeded.
The notebook server will temporarily stop sending output
to the client in order to avoid crashing it.
To change this limit, set the config variable
`--NotebookApp.iopub_msg_rate_limit`.

Current values:
NotebookApp.iopub_msg_rate_limit=1000.0 (msgs/sec)
NotebookApp.rate_limit_window=3.0 (secs)



Epoch 81:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.193, v_num=3, train_loss=0.123, train_accuracy=1.000, val_loss=0.273, val_accuracy=0.892] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 81:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.193, v_num=3, train_loss=0.123, train_accuracy=1.000, val_loss=0.273, val_accuracy=0.892]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.30s/it][A
Epoch 81:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.193, v_num=3, train_loss=0.123, train_accuracy=1.000, val_loss=0.273, val_accuracy=0.892]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.79it/s][A
Epoch 81:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.193, v_num=3, train_loss=0.123, train_accuracy=1.000, val_loss=0.273, val_accuracy=0.892]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.95it/s][A
Epoch 81:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.193, v_num=3, train_loss=0.123

Epoch 81, global step 18531: val_loss was not in top 2


Epoch 82:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.178, v_num=3, train_loss=0.212, train_accuracy=0.944, val_loss=0.240, val_accuracy=0.894] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 82:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.178, v_num=3, train_loss=0.212, train_accuracy=0.944, val_loss=0.240, val_accuracy=0.894]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.33s/it][A
Epoch 82:  90%|█████████ | 230/255 [02:45<00:18,  1.39it/s, loss=0.178, v_num=3, train_loss=0.212, train_accuracy=0.944, val_loss=0.240, val_accuracy=0.894]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.75it/s][A
Epoch 82:  91%|█████████ | 232/255 [02:46<00:16,  1.40it/s, loss=0.178, v_num=3, train_loss=0.212, train_accuracy=0.944, val_loss=0.240, val_accuracy=0.894]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.86it/s][A
Epoch 82:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.178, v_num=3, train_loss=0.212

Epoch 82, global step 18757: val_loss was not in top 2


Epoch 83:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.133, v_num=3, train_loss=0.106, train_accuracy=0.944, val_loss=0.281, val_accuracy=0.887] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 83:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.133, v_num=3, train_loss=0.106, train_accuracy=0.944, val_loss=0.281, val_accuracy=0.887]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.30s/it][A
Epoch 83:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.133, v_num=3, train_loss=0.106, train_accuracy=0.944, val_loss=0.281, val_accuracy=0.887]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.79it/s][A
Epoch 83:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.133, v_num=3, train_loss=0.106, train_accuracy=0.944, val_loss=0.281, val_accuracy=0.887]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.91it/s][A
Epoch 83:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.133, v_num=3, train_loss=0.106

Epoch 83, global step 18983: val_loss was not in top 2


Epoch 84:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.155, v_num=3, train_loss=0.143, train_accuracy=0.944, val_loss=0.252, val_accuracy=0.903] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 84:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.155, v_num=3, train_loss=0.143, train_accuracy=0.944, val_loss=0.252, val_accuracy=0.903]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.31s/it][A
Epoch 84:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.155, v_num=3, train_loss=0.143, train_accuracy=0.944, val_loss=0.252, val_accuracy=0.903]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.81it/s][A
Epoch 84:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.155, v_num=3, train_loss=0.143, train_accuracy=0.944, val_loss=0.252, val_accuracy=0.903]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.96it/s][A
Epoch 84:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.155, v_num=3, train_loss=0.143

Epoch 84, global step 19209: val_loss reached 0.22359 (best 0.22219), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28.ckpt" as top 2


Epoch 85:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.22, v_num=3, train_loss=0.605, train_accuracy=0.889, val_loss=0.224, val_accuracy=0.911]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 85:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.22, v_num=3, train_loss=0.605, train_accuracy=0.889, val_loss=0.224, val_accuracy=0.911]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.32s/it][A
Epoch 85:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.22, v_num=3, train_loss=0.605, train_accuracy=0.889, val_loss=0.224, val_accuracy=0.911]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.77it/s][A
Epoch 85:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.22, v_num=3, train_loss=0.605, train_accuracy=0.889, val_loss=0.224, val_accuracy=0.911]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.90it/s][A
Epoch 85:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.22, v_num=3, train_loss=0.605, tr

Epoch 85, global step 19435: val_loss was not in top 2


Epoch 86:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.166, v_num=3, train_loss=0.0741, train_accuracy=0.944, val_loss=0.560, val_accuracy=0.828]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 86:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.166, v_num=3, train_loss=0.0741, train_accuracy=0.944, val_loss=0.560, val_accuracy=0.828]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.30s/it][A
Epoch 86:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.166, v_num=3, train_loss=0.0741, train_accuracy=0.944, val_loss=0.560, val_accuracy=0.828]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.78it/s][A
Epoch 86:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.166, v_num=3, train_loss=0.0741, train_accuracy=0.944, val_loss=0.560, val_accuracy=0.828]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.84it/s][A
Epoch 86:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.166, v_num=3, train_loss=0.

Epoch 86, global step 19661: val_loss was not in top 2


Epoch 87:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.143, v_num=3, train_loss=0.250, train_accuracy=0.889, val_loss=0.230, val_accuracy=0.899] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 87:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.143, v_num=3, train_loss=0.250, train_accuracy=0.889, val_loss=0.230, val_accuracy=0.899]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.32s/it][A
Epoch 87:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.143, v_num=3, train_loss=0.250, train_accuracy=0.889, val_loss=0.230, val_accuracy=0.899]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.80it/s][A
Epoch 87:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.143, v_num=3, train_loss=0.250, train_accuracy=0.889, val_loss=0.230, val_accuracy=0.899]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.90it/s][A
Epoch 87:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.143, v_num=3, train_loss=0.250

Epoch 87, global step 19887: val_loss was not in top 2


Epoch 88:  22%|██▏       | 55/255 [00:41<02:30,  1.33it/s, loss=0.14, v_num=3, train_loss=0.139, train_accuracy=0.920, val_loss=0.239, val_accuracy=0.908]  

IOPub message rate exceeded.
The notebook server will temporarily stop sending output
to the client in order to avoid crashing it.
To change this limit, set the config variable
`--NotebookApp.iopub_msg_rate_limit`.

Current values:
NotebookApp.iopub_msg_rate_limit=1000.0 (msgs/sec)
NotebookApp.rate_limit_window=3.0 (secs)



Epoch 91:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.221, v_num=3, train_loss=0.362, train_accuracy=0.889, val_loss=0.218, val_accuracy=0.909] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 91:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.221, v_num=3, train_loss=0.362, train_accuracy=0.889, val_loss=0.218, val_accuracy=0.909]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.32s/it][A
Epoch 91:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.221, v_num=3, train_loss=0.362, train_accuracy=0.889, val_loss=0.218, val_accuracy=0.909]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.80it/s][A
Epoch 91:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.221, v_num=3, train_loss=0.362, train_accuracy=0.889, val_loss=0.218, val_accuracy=0.909]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.95it/s][A
Epoch 91:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.221, v_num=3, train_loss=0.362

Epoch 91, global step 20791: val_loss was not in top 2


Epoch 92:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.179, v_num=3, train_loss=0.207, train_accuracy=0.889, val_loss=0.258, val_accuracy=0.904] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 92:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.179, v_num=3, train_loss=0.207, train_accuracy=0.889, val_loss=0.258, val_accuracy=0.904]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.33s/it][A
Epoch 92:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.179, v_num=3, train_loss=0.207, train_accuracy=0.889, val_loss=0.258, val_accuracy=0.904]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.80it/s][A
Epoch 92:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.179, v_num=3, train_loss=0.207, train_accuracy=0.889, val_loss=0.258, val_accuracy=0.904]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.96it/s][A
Epoch 92:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.179, v_num=3, train_loss=0.207

Epoch 92, global step 21017: val_loss was not in top 2


Epoch 93:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.152, v_num=3, train_loss=0.085, train_accuracy=0.944, val_loss=0.241, val_accuracy=0.901] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 93:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.152, v_num=3, train_loss=0.085, train_accuracy=0.944, val_loss=0.241, val_accuracy=0.901]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.32s/it][A
Epoch 93:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.152, v_num=3, train_loss=0.085, train_accuracy=0.944, val_loss=0.241, val_accuracy=0.901]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.79it/s][A
Epoch 93:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.152, v_num=3, train_loss=0.085, train_accuracy=0.944, val_loss=0.241, val_accuracy=0.901]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.87it/s][A
Epoch 93:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.152, v_num=3, train_loss=0.085

Epoch 93, global step 21243: val_loss reached 0.21134 (best 0.21134), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28-v1.ckpt" as top 2


Epoch 94:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.155, v_num=3, train_loss=0.161, train_accuracy=0.944, val_loss=0.211, val_accuracy=0.920] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 94:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.155, v_num=3, train_loss=0.161, train_accuracy=0.944, val_loss=0.211, val_accuracy=0.920]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.33s/it][A
Epoch 94:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.155, v_num=3, train_loss=0.161, train_accuracy=0.944, val_loss=0.211, val_accuracy=0.920]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.78it/s][A
Epoch 94:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.155, v_num=3, train_loss=0.161, train_accuracy=0.944, val_loss=0.211, val_accuracy=0.920]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.95it/s][A
Epoch 94:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.155, v_num=3, train_loss=0.161

Epoch 94, global step 21469: val_loss was not in top 2


Epoch 95:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.129, v_num=3, train_loss=0.0661, train_accuracy=1.000, val_loss=0.243, val_accuracy=0.903]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 95:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.129, v_num=3, train_loss=0.0661, train_accuracy=1.000, val_loss=0.243, val_accuracy=0.903]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.31s/it][A
Epoch 95:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.129, v_num=3, train_loss=0.0661, train_accuracy=1.000, val_loss=0.243, val_accuracy=0.903]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.80it/s][A
Epoch 95:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.129, v_num=3, train_loss=0.0661, train_accuracy=1.000, val_loss=0.243, val_accuracy=0.903]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.90it/s][A
Epoch 95:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.129, v_num=3, train_loss=0.

Epoch 95, global step 21695: val_loss was not in top 2


Epoch 96:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.148, v_num=3, train_loss=0.0229, train_accuracy=1.000, val_loss=0.254, val_accuracy=0.906]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 96:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.148, v_num=3, train_loss=0.0229, train_accuracy=1.000, val_loss=0.254, val_accuracy=0.906]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.33s/it][A
Epoch 96:  90%|█████████ | 230/255 [02:45<00:18,  1.39it/s, loss=0.148, v_num=3, train_loss=0.0229, train_accuracy=1.000, val_loss=0.254, val_accuracy=0.906]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.77it/s][A
Epoch 96:  91%|█████████ | 232/255 [02:46<00:16,  1.40it/s, loss=0.148, v_num=3, train_loss=0.0229, train_accuracy=1.000, val_loss=0.254, val_accuracy=0.906]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.92it/s][A
Epoch 96:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.148, v_num=3, train_loss=0.

Epoch 96, global step 21921: val_loss was not in top 2


Epoch 97:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.162, v_num=3, train_loss=0.103, train_accuracy=0.944, val_loss=0.341, val_accuracy=0.886] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 97:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.162, v_num=3, train_loss=0.103, train_accuracy=0.944, val_loss=0.341, val_accuracy=0.886]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.32s/it][A
Epoch 97:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.162, v_num=3, train_loss=0.103, train_accuracy=0.944, val_loss=0.341, val_accuracy=0.886]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.80it/s][A
Epoch 97:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.162, v_num=3, train_loss=0.103, train_accuracy=0.944, val_loss=0.341, val_accuracy=0.886]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.93it/s][A
Epoch 97:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.162, v_num=3, train_loss=0.103

Epoch 97, global step 22147: val_loss was not in top 2


Epoch 98:  33%|███▎      | 85/255 [01:02<02:05,  1.36it/s, loss=0.158, v_num=3, train_loss=0.0736, train_accuracy=0.980, val_loss=0.258, val_accuracy=0.905]

IOPub message rate exceeded.
The notebook server will temporarily stop sending output
to the client in order to avoid crashing it.
To change this limit, set the config variable
`--NotebookApp.iopub_msg_rate_limit`.

Current values:
NotebookApp.iopub_msg_rate_limit=1000.0 (msgs/sec)
NotebookApp.rate_limit_window=3.0 (secs)




Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 101:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.147, v_num=3, train_loss=0.325, train_accuracy=0.833, val_loss=0.216, val_accuracy=0.913]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.33s/it][A
Epoch 101:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.147, v_num=3, train_loss=0.325, train_accuracy=0.833, val_loss=0.216, val_accuracy=0.913]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.79it/s][A
Epoch 101:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.147, v_num=3, train_loss=0.325, train_accuracy=0.833, val_loss=0.216, val_accuracy=0.913]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.93it/s][A
Epoch 101:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.147, v_num=3, train_loss=0.325, train_accuracy=0.833, val_loss=0.216, val_accuracy=0.913]
Validating:  28%|██▊       | 8/29 [00:04<00:05,  3.88it/s][A
Epoch 101:  93%|█████████▎| 236

Epoch 101, global step 23051: val_loss reached 0.19952 (best 0.19952), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28-v1.ckpt" as top 2


Epoch 102:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.17, v_num=3, train_loss=0.125, train_accuracy=0.944, val_loss=0.200, val_accuracy=0.914]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 102:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.17, v_num=3, train_loss=0.125, train_accuracy=0.944, val_loss=0.200, val_accuracy=0.914]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 102:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.17, v_num=3, train_loss=0.125, train_accuracy=0.944, val_loss=0.200, val_accuracy=0.914]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.76it/s][A
Epoch 102:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.17, v_num=3, train_loss=0.125, train_accuracy=0.944, val_loss=0.200, val_accuracy=0.914]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.85it/s][A
Epoch 102:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.17, v_num=3, train_loss=0.12

Epoch 102, global step 23277: val_loss was not in top 2


Epoch 103:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.142, v_num=3, train_loss=0.120, train_accuracy=0.944, val_loss=0.253, val_accuracy=0.907] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 103:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.142, v_num=3, train_loss=0.120, train_accuracy=0.944, val_loss=0.253, val_accuracy=0.907]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.33s/it][A
Epoch 103:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.142, v_num=3, train_loss=0.120, train_accuracy=0.944, val_loss=0.253, val_accuracy=0.907]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.75it/s][A
Epoch 103:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.142, v_num=3, train_loss=0.120, train_accuracy=0.944, val_loss=0.253, val_accuracy=0.907]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.84it/s][A
Epoch 103:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.142, v_num=3, train_loss=

Epoch 103, global step 23503: val_loss was not in top 2


Epoch 104:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.135, v_num=3, train_loss=0.036, train_accuracy=1.000, val_loss=0.225, val_accuracy=0.906]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 104:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.135, v_num=3, train_loss=0.036, train_accuracy=1.000, val_loss=0.225, val_accuracy=0.906]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 104:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.135, v_num=3, train_loss=0.036, train_accuracy=1.000, val_loss=0.225, val_accuracy=0.906]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.78it/s][A
Epoch 104:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.135, v_num=3, train_loss=0.036, train_accuracy=1.000, val_loss=0.225, val_accuracy=0.906]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.93it/s][A
Epoch 104:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.135, v_num=3, train_loss

Epoch 104, global step 23729: val_loss reached 0.19103 (best 0.19103), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28.ckpt" as top 2


Epoch 105:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.114, v_num=3, train_loss=0.110, train_accuracy=0.944, val_loss=0.191, val_accuracy=0.925] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 105:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.114, v_num=3, train_loss=0.110, train_accuracy=0.944, val_loss=0.191, val_accuracy=0.925]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.33s/it][A
Epoch 105:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.114, v_num=3, train_loss=0.110, train_accuracy=0.944, val_loss=0.191, val_accuracy=0.925]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.71it/s][A
Epoch 105:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.114, v_num=3, train_loss=0.110, train_accuracy=0.944, val_loss=0.191, val_accuracy=0.925]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.83it/s][A
Epoch 105:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.114, v_num=3, train_loss=

Epoch 105, global step 23955: val_loss was not in top 2


Epoch 106:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.226, v_num=3, train_loss=0.0988, train_accuracy=1.000, val_loss=0.244, val_accuracy=0.923]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 106:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.226, v_num=3, train_loss=0.0988, train_accuracy=1.000, val_loss=0.244, val_accuracy=0.923]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.33s/it][A
Epoch 106:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.226, v_num=3, train_loss=0.0988, train_accuracy=1.000, val_loss=0.244, val_accuracy=0.923]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.78it/s][A
Epoch 106:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.226, v_num=3, train_loss=0.0988, train_accuracy=1.000, val_loss=0.244, val_accuracy=0.923]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.90it/s][A
Epoch 106:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.226, v_num=3, train_lo

Epoch 106, global step 24181: val_loss was not in top 2


Epoch 107:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.153, v_num=3, train_loss=0.0469, train_accuracy=1.000, val_loss=0.320, val_accuracy=0.864]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 107:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.153, v_num=3, train_loss=0.0469, train_accuracy=1.000, val_loss=0.320, val_accuracy=0.864]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 107:  90%|█████████ | 230/255 [02:45<00:18,  1.39it/s, loss=0.153, v_num=3, train_loss=0.0469, train_accuracy=1.000, val_loss=0.320, val_accuracy=0.864]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.76it/s][A
Epoch 107:  91%|█████████ | 232/255 [02:46<00:16,  1.40it/s, loss=0.153, v_num=3, train_loss=0.0469, train_accuracy=1.000, val_loss=0.320, val_accuracy=0.864]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.91it/s][A
Epoch 107:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.153, v_num=3, train_lo

Epoch 107, global step 24407: val_loss was not in top 2


Epoch 108:  42%|████▏     | 108/255 [01:18<01:47,  1.37it/s, loss=0.154, v_num=3, train_loss=0.226, train_accuracy=0.860, val_loss=0.237, val_accuracy=0.908] 

IOPub message rate exceeded.
The notebook server will temporarily stop sending output
to the client in order to avoid crashing it.
To change this limit, set the config variable
`--NotebookApp.iopub_msg_rate_limit`.

Current values:
NotebookApp.iopub_msg_rate_limit=1000.0 (msgs/sec)
NotebookApp.rate_limit_window=3.0 (secs)



Epoch 111:  96%|█████████▋| 246/255 [02:48<00:06,  1.46it/s, loss=0.181, v_num=3, train_loss=0.151, train_accuracy=0.944, val_loss=0.236, val_accuracy=0.909]
Validating:  69%|██████▉   | 20/29 [00:06<00:01,  5.59it/s][A
Epoch 111:  97%|█████████▋| 248/255 [02:48<00:04,  1.47it/s, loss=0.181, v_num=3, train_loss=0.151, train_accuracy=0.944, val_loss=0.236, val_accuracy=0.909]
Validating:  76%|███████▌  | 22/29 [00:06<00:01,  5.47it/s][A
Epoch 111:  98%|█████████▊| 250/255 [02:49<00:03,  1.48it/s, loss=0.181, v_num=3, train_loss=0.151, train_accuracy=0.944, val_loss=0.236, val_accuracy=0.909]
Validating:  83%|████████▎ | 24/29 [00:07<00:00,  5.47it/s][A
Epoch 111:  99%|█████████▉| 252/255 [02:49<00:02,  1.49it/s, loss=0.181, v_num=3, train_loss=0.151, train_accuracy=0.944, val_loss=0.236, val_accuracy=0.909]
Validating:  90%|████████▉ | 26/29 [00:07<00:00,  5.38it/s][A
Epoch 111: 100%|█████████▉| 254/255 [02:50<00:00,  1.49it/s, loss=0.181, v_num=3, train_loss=0.151, train_accuracy=0

Epoch 111, global step 25311: val_loss was not in top 2


Epoch 112:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.193, v_num=3, train_loss=0.141, train_accuracy=0.944, val_loss=0.238, val_accuracy=0.905] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 112:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.193, v_num=3, train_loss=0.141, train_accuracy=0.944, val_loss=0.238, val_accuracy=0.905]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.35s/it][A
Epoch 112:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.193, v_num=3, train_loss=0.141, train_accuracy=0.944, val_loss=0.238, val_accuracy=0.905]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.74it/s][A
Epoch 112:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.193, v_num=3, train_loss=0.141, train_accuracy=0.944, val_loss=0.238, val_accuracy=0.905]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.82it/s][A
Epoch 112:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.193, v_num=3, train_loss=

Epoch 112, global step 25537: val_loss was not in top 2


Epoch 113:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.155, v_num=3, train_loss=0.124, train_accuracy=0.944, val_loss=0.233, val_accuracy=0.885] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 113:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.155, v_num=3, train_loss=0.124, train_accuracy=0.944, val_loss=0.233, val_accuracy=0.885]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.33s/it][A
Epoch 113:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.155, v_num=3, train_loss=0.124, train_accuracy=0.944, val_loss=0.233, val_accuracy=0.885]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.77it/s][A
Epoch 113:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.155, v_num=3, train_loss=0.124, train_accuracy=0.944, val_loss=0.233, val_accuracy=0.885]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.92it/s][A
Epoch 113:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.155, v_num=3, train_loss=

Epoch 113, global step 25763: val_loss was not in top 2


Epoch 114:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.143, v_num=3, train_loss=0.0408, train_accuracy=1.000, val_loss=0.203, val_accuracy=0.913] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 114:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.143, v_num=3, train_loss=0.0408, train_accuracy=1.000, val_loss=0.203, val_accuracy=0.913]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.33s/it][A
Epoch 114:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.143, v_num=3, train_loss=0.0408, train_accuracy=1.000, val_loss=0.203, val_accuracy=0.913]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.77it/s][A
Epoch 114:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.143, v_num=3, train_loss=0.0408, train_accuracy=1.000, val_loss=0.203, val_accuracy=0.913]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.87it/s][A
Epoch 114:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.143, v_num=3, train_l

Epoch 114, global step 25989: val_loss reached 0.19298 (best 0.19103), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28-v1.ckpt" as top 2


Epoch 115:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.139, v_num=3, train_loss=0.0256, train_accuracy=1.000, val_loss=0.193, val_accuracy=0.925]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 115:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.139, v_num=3, train_loss=0.0256, train_accuracy=1.000, val_loss=0.193, val_accuracy=0.925]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.36s/it][A
Epoch 115:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.139, v_num=3, train_loss=0.0256, train_accuracy=1.000, val_loss=0.193, val_accuracy=0.925]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.77it/s][A
Epoch 115:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.139, v_num=3, train_loss=0.0256, train_accuracy=1.000, val_loss=0.193, val_accuracy=0.925]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.91it/s][A
Epoch 115:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.139, v_num=3, train_lo

Epoch 115, global step 26215: val_loss was not in top 2


Epoch 116:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.123, v_num=3, train_loss=0.144, train_accuracy=0.889, val_loss=0.197, val_accuracy=0.913]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 116:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.123, v_num=3, train_loss=0.144, train_accuracy=0.889, val_loss=0.197, val_accuracy=0.913]
Validating:   7%|▋         | 2/29 [00:03<00:37,  1.38s/it][A
Epoch 116:  90%|█████████ | 230/255 [02:45<00:18,  1.39it/s, loss=0.123, v_num=3, train_loss=0.144, train_accuracy=0.889, val_loss=0.197, val_accuracy=0.913]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.74it/s][A
Epoch 116:  91%|█████████ | 232/255 [02:46<00:16,  1.40it/s, loss=0.123, v_num=3, train_loss=0.144, train_accuracy=0.889, val_loss=0.197, val_accuracy=0.913]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.88it/s][A
Epoch 116:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.123, v_num=3, train_loss

Epoch 116, global step 26441: val_loss was not in top 2


Epoch 117:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.118, v_num=3, train_loss=0.235, train_accuracy=0.833, val_loss=0.195, val_accuracy=0.930] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 117:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.118, v_num=3, train_loss=0.235, train_accuracy=0.833, val_loss=0.195, val_accuracy=0.930]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.35s/it][A
Epoch 117:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.118, v_num=3, train_loss=0.235, train_accuracy=0.833, val_loss=0.195, val_accuracy=0.930]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.75it/s][A
Epoch 117:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.118, v_num=3, train_loss=0.235, train_accuracy=0.833, val_loss=0.195, val_accuracy=0.930]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.86it/s][A
Epoch 117:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.118, v_num=3, train_loss=

Epoch 117, global step 26667: val_loss was not in top 2


Epoch 118:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.109, v_num=3, train_loss=0.0212, train_accuracy=1.000, val_loss=0.222, val_accuracy=0.921] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 118:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.109, v_num=3, train_loss=0.0212, train_accuracy=1.000, val_loss=0.222, val_accuracy=0.921]
Validating:   7%|▋         | 2/29 [00:03<00:37,  1.39s/it][A
Epoch 118:  90%|█████████ | 230/255 [02:46<00:18,  1.38it/s, loss=0.109, v_num=3, train_loss=0.0212, train_accuracy=1.000, val_loss=0.222, val_accuracy=0.921]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.73it/s][A
Epoch 118:  91%|█████████ | 232/255 [02:46<00:16,  1.39it/s, loss=0.109, v_num=3, train_loss=0.0212, train_accuracy=1.000, val_loss=0.222, val_accuracy=0.921]
Validating:  21%|██        | 6/29 [00:04<00:07,  2.90it/s][A
Epoch 118:  92%|█████████▏| 234/255 [02:46<00:14,  1.40it/s, loss=0.109, v_num=3, train_l

Epoch 118, global step 26893: val_loss was not in top 2


Epoch 119:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.107, v_num=3, train_loss=0.0158, train_accuracy=1.000, val_loss=0.194, val_accuracy=0.922] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 119:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.107, v_num=3, train_loss=0.0158, train_accuracy=1.000, val_loss=0.194, val_accuracy=0.922]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.33s/it][A
Epoch 119:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.107, v_num=3, train_loss=0.0158, train_accuracy=1.000, val_loss=0.194, val_accuracy=0.922]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.76it/s][A
Epoch 119:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.107, v_num=3, train_loss=0.0158, train_accuracy=1.000, val_loss=0.194, val_accuracy=0.922]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.84it/s][A
Epoch 119:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.107, v_num=3, train_l

Epoch 119, global step 27119: val_loss reached 0.18296 (best 0.18296), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28-v1.ckpt" as top 2


Epoch 120:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.119, v_num=3, train_loss=0.0141, train_accuracy=1.000, val_loss=0.183, val_accuracy=0.921] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 120:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.119, v_num=3, train_loss=0.0141, train_accuracy=1.000, val_loss=0.183, val_accuracy=0.921]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 120:  90%|█████████ | 230/255 [02:45<00:18,  1.39it/s, loss=0.119, v_num=3, train_loss=0.0141, train_accuracy=1.000, val_loss=0.183, val_accuracy=0.921]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.76it/s][A
Epoch 120:  91%|█████████ | 232/255 [02:46<00:16,  1.40it/s, loss=0.119, v_num=3, train_loss=0.0141, train_accuracy=1.000, val_loss=0.183, val_accuracy=0.921]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.87it/s][A
Epoch 120:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.119, v_num=3, train_l

Epoch 120, global step 27345: val_loss was not in top 2


Epoch 121:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.126, v_num=3, train_loss=0.270, train_accuracy=0.944, val_loss=0.218, val_accuracy=0.918]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 121:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.126, v_num=3, train_loss=0.270, train_accuracy=0.944, val_loss=0.218, val_accuracy=0.918]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.33s/it][A
Epoch 121:  90%|█████████ | 230/255 [02:45<00:18,  1.39it/s, loss=0.126, v_num=3, train_loss=0.270, train_accuracy=0.944, val_loss=0.218, val_accuracy=0.918]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.75it/s][A
Epoch 121:  91%|█████████ | 232/255 [02:46<00:16,  1.40it/s, loss=0.126, v_num=3, train_loss=0.270, train_accuracy=0.944, val_loss=0.218, val_accuracy=0.918]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.92it/s][A
Epoch 121:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.126, v_num=3, train_loss

Epoch 121, global step 27571: val_loss was not in top 2


Epoch 122:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.103, v_num=3, train_loss=0.201, train_accuracy=0.944, val_loss=0.240, val_accuracy=0.913]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 122:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.103, v_num=3, train_loss=0.201, train_accuracy=0.944, val_loss=0.240, val_accuracy=0.913]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 122:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.103, v_num=3, train_loss=0.201, train_accuracy=0.944, val_loss=0.240, val_accuracy=0.913]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.76it/s][A
Epoch 122:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.103, v_num=3, train_loss=0.201, train_accuracy=0.944, val_loss=0.240, val_accuracy=0.913]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.87it/s][A
Epoch 122:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.103, v_num=3, train_loss

Epoch 122, global step 27797: val_loss was not in top 2


Epoch 123:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.107, v_num=3, train_loss=0.0696, train_accuracy=0.944, val_loss=0.204, val_accuracy=0.922] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 123:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.107, v_num=3, train_loss=0.0696, train_accuracy=0.944, val_loss=0.204, val_accuracy=0.922]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 123:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.107, v_num=3, train_loss=0.0696, train_accuracy=0.944, val_loss=0.204, val_accuracy=0.922]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.77it/s][A
Epoch 123:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.107, v_num=3, train_loss=0.0696, train_accuracy=0.944, val_loss=0.204, val_accuracy=0.922]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.86it/s][A
Epoch 123:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.107, v_num=3, train_l

Epoch 123, global step 28023: val_loss was not in top 2


Epoch 124:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.0816, v_num=3, train_loss=0.0163, train_accuracy=1.000, val_loss=0.220, val_accuracy=0.923]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 124:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.0816, v_num=3, train_loss=0.0163, train_accuracy=1.000, val_loss=0.220, val_accuracy=0.923]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.33s/it][A
Epoch 124:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.0816, v_num=3, train_loss=0.0163, train_accuracy=1.000, val_loss=0.220, val_accuracy=0.923]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.78it/s][A
Epoch 124:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.0816, v_num=3, train_loss=0.0163, train_accuracy=1.000, val_loss=0.220, val_accuracy=0.923]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.90it/s][A
Epoch 124:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.0816, v_num=3, tra

Epoch 124, global step 28249: val_loss was not in top 2


Epoch 125:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.114, v_num=3, train_loss=0.268, train_accuracy=0.944, val_loss=0.203, val_accuracy=0.925]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 125:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.114, v_num=3, train_loss=0.268, train_accuracy=0.944, val_loss=0.203, val_accuracy=0.925]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.32s/it][A
Epoch 125:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.114, v_num=3, train_loss=0.268, train_accuracy=0.944, val_loss=0.203, val_accuracy=0.925]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.77it/s][A
Epoch 125:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.114, v_num=3, train_loss=0.268, train_accuracy=0.944, val_loss=0.203, val_accuracy=0.925]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.89it/s][A
Epoch 125:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.114, v_num=3, train_loss

Epoch 125, global step 28475: val_loss reached 0.17998 (best 0.17998), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28.ckpt" as top 2


Epoch 126:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.128, v_num=3, train_loss=0.0735, train_accuracy=0.944, val_loss=0.180, val_accuracy=0.924] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 126:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.128, v_num=3, train_loss=0.0735, train_accuracy=0.944, val_loss=0.180, val_accuracy=0.924]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 126:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.128, v_num=3, train_loss=0.0735, train_accuracy=0.944, val_loss=0.180, val_accuracy=0.924]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.77it/s][A
Epoch 126:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.128, v_num=3, train_loss=0.0735, train_accuracy=0.944, val_loss=0.180, val_accuracy=0.924]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.93it/s][A
Epoch 126:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.128, v_num=3, train_l

Epoch 126, global step 28701: val_loss was not in top 2


Epoch 127:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.0927, v_num=3, train_loss=0.110, train_accuracy=1.000, val_loss=0.228, val_accuracy=0.916] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 127:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.0927, v_num=3, train_loss=0.110, train_accuracy=1.000, val_loss=0.228, val_accuracy=0.916]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.35s/it][A
Epoch 127:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.0927, v_num=3, train_loss=0.110, train_accuracy=1.000, val_loss=0.228, val_accuracy=0.916]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.75it/s][A
Epoch 127:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.0927, v_num=3, train_loss=0.110, train_accuracy=1.000, val_loss=0.228, val_accuracy=0.916]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.84it/s][A
Epoch 127:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.0927, v_num=3, train_

Epoch 127, global step 28927: val_loss reached 0.17980 (best 0.17980), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-28-v1.ckpt" as top 2


Epoch 128:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.148, v_num=3, train_loss=0.301, train_accuracy=0.833, val_loss=0.180, val_accuracy=0.930]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 128:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.148, v_num=3, train_loss=0.301, train_accuracy=0.833, val_loss=0.180, val_accuracy=0.930]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.36s/it][A
Epoch 128:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.148, v_num=3, train_loss=0.301, train_accuracy=0.833, val_loss=0.180, val_accuracy=0.930]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.74it/s][A
Epoch 128:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.148, v_num=3, train_loss=0.301, train_accuracy=0.833, val_loss=0.180, val_accuracy=0.930]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.88it/s][A
Epoch 128:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.148, v_num=3, train_loss

Epoch 128, global step 29153: val_loss was not in top 2


Epoch 129:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.11, v_num=3, train_loss=0.0672, train_accuracy=1.000, val_loss=0.206, val_accuracy=0.925]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 129:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.11, v_num=3, train_loss=0.0672, train_accuracy=1.000, val_loss=0.206, val_accuracy=0.925]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.33s/it][A
Epoch 129:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.11, v_num=3, train_loss=0.0672, train_accuracy=1.000, val_loss=0.206, val_accuracy=0.925]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.79it/s][A
Epoch 129:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.11, v_num=3, train_loss=0.0672, train_accuracy=1.000, val_loss=0.206, val_accuracy=0.925]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.93it/s][A
Epoch 129:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.11, v_num=3, train_loss=

Epoch 145, global step 32995: val_loss was not in top 2


Epoch 146:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.309, v_num=3, train_loss=0.295, train_accuracy=0.833, val_loss=0.378, val_accuracy=0.866] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 146:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.309, v_num=3, train_loss=0.295, train_accuracy=0.833, val_loss=0.378, val_accuracy=0.866]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.33s/it][A
Epoch 146:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.309, v_num=3, train_loss=0.295, train_accuracy=0.833, val_loss=0.378, val_accuracy=0.866]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.77it/s][A
Epoch 146:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.309, v_num=3, train_loss=0.295, train_accuracy=0.833, val_loss=0.378, val_accuracy=0.866]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.90it/s][A
Epoch 146:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.309, v_num=3, train_loss=

Epoch 146, global step 33221: val_loss was not in top 2


Epoch 147:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.215, v_num=3, train_loss=0.266, train_accuracy=0.833, val_loss=0.341, val_accuracy=0.845]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 147:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.215, v_num=3, train_loss=0.266, train_accuracy=0.833, val_loss=0.341, val_accuracy=0.845]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.35s/it][A
Epoch 147:  90%|█████████ | 230/255 [02:45<00:18,  1.39it/s, loss=0.215, v_num=3, train_loss=0.266, train_accuracy=0.833, val_loss=0.341, val_accuracy=0.845]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.73it/s][A
Epoch 147:  91%|█████████ | 232/255 [02:46<00:16,  1.40it/s, loss=0.215, v_num=3, train_loss=0.266, train_accuracy=0.833, val_loss=0.341, val_accuracy=0.845]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.86it/s][A
Epoch 147:  92%|█████████▏| 234/255 [02:46<00:14,  1.40it/s, loss=0.215, v_num=3, train_loss=0

Epoch 147, global step 33447: val_loss was not in top 2


Epoch 148:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.294, v_num=3, train_loss=0.308, train_accuracy=0.833, val_loss=0.292, val_accuracy=0.875] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 148:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.294, v_num=3, train_loss=0.308, train_accuracy=0.833, val_loss=0.292, val_accuracy=0.875]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 148:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.294, v_num=3, train_loss=0.308, train_accuracy=0.833, val_loss=0.292, val_accuracy=0.875]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.78it/s][A
Epoch 148:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.294, v_num=3, train_loss=0.308, train_accuracy=0.833, val_loss=0.292, val_accuracy=0.875]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.91it/s][A
Epoch 148:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.294, v_num=3, train_loss=

Epoch 148, global step 33673: val_loss was not in top 2


Epoch 149:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.22, v_num=3, train_loss=0.347, train_accuracy=0.833, val_loss=0.327, val_accuracy=0.863]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 149:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.22, v_num=3, train_loss=0.347, train_accuracy=0.833, val_loss=0.327, val_accuracy=0.863]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.35s/it][A
Epoch 149:  90%|█████████ | 230/255 [02:45<00:18,  1.39it/s, loss=0.22, v_num=3, train_loss=0.347, train_accuracy=0.833, val_loss=0.327, val_accuracy=0.863]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.76it/s][A
Epoch 149:  91%|█████████ | 232/255 [02:46<00:16,  1.40it/s, loss=0.22, v_num=3, train_loss=0.347, train_accuracy=0.833, val_loss=0.327, val_accuracy=0.863]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.83it/s][A
Epoch 149:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.22, v_num=3, train_loss=0.34

Epoch 149, global step 33899: val_loss was not in top 2


Epoch 150:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.253, v_num=3, train_loss=0.245, train_accuracy=0.778, val_loss=0.275, val_accuracy=0.887] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 150:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.253, v_num=3, train_loss=0.245, train_accuracy=0.778, val_loss=0.275, val_accuracy=0.887]
Validating:   7%|▋         | 2/29 [00:03<00:37,  1.37s/it][A
Epoch 150:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.253, v_num=3, train_loss=0.245, train_accuracy=0.778, val_loss=0.275, val_accuracy=0.887]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.75it/s][A
Epoch 150:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.253, v_num=3, train_loss=0.245, train_accuracy=0.778, val_loss=0.275, val_accuracy=0.887]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.91it/s][A
Epoch 150:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.253, v_num=3, train_loss=

Epoch 150, global step 34125: val_loss was not in top 2


Epoch 151:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.248, v_num=3, train_loss=0.267, train_accuracy=0.889, val_loss=0.308, val_accuracy=0.886]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 151:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.248, v_num=3, train_loss=0.267, train_accuracy=0.889, val_loss=0.308, val_accuracy=0.886]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.36s/it][A
Epoch 151:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.248, v_num=3, train_loss=0.267, train_accuracy=0.889, val_loss=0.308, val_accuracy=0.886]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.74it/s][A
Epoch 151:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.248, v_num=3, train_loss=0.267, train_accuracy=0.889, val_loss=0.308, val_accuracy=0.886]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.83it/s][A
Epoch 151:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.248, v_num=3, train_loss=0

Epoch 151, global step 34351: val_loss was not in top 2


Epoch 152:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.239, v_num=3, train_loss=0.224, train_accuracy=0.944, val_loss=0.291, val_accuracy=0.883] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 152:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.239, v_num=3, train_loss=0.224, train_accuracy=0.944, val_loss=0.291, val_accuracy=0.883]
Validating:   7%|▋         | 2/29 [00:03<00:38,  1.41s/it][A
Epoch 152:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.239, v_num=3, train_loss=0.224, train_accuracy=0.944, val_loss=0.291, val_accuracy=0.883]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.67it/s][A
Epoch 152:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.239, v_num=3, train_loss=0.224, train_accuracy=0.944, val_loss=0.291, val_accuracy=0.883]
Validating:  21%|██        | 6/29 [00:04<00:08,  2.77it/s][A
Epoch 152:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.239, v_num=3, train_loss=

Epoch 152, global step 34577: val_loss was not in top 2


Epoch 153:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.199, v_num=3, train_loss=0.163, train_accuracy=0.889, val_loss=0.383, val_accuracy=0.854] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 153:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.199, v_num=3, train_loss=0.163, train_accuracy=0.889, val_loss=0.383, val_accuracy=0.854]
Validating:   7%|▋         | 2/29 [00:03<00:37,  1.38s/it][A
Epoch 153:  90%|█████████ | 230/255 [02:45<00:18,  1.39it/s, loss=0.199, v_num=3, train_loss=0.163, train_accuracy=0.889, val_loss=0.383, val_accuracy=0.854]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.76it/s][A
Epoch 153:  91%|█████████ | 232/255 [02:46<00:16,  1.40it/s, loss=0.199, v_num=3, train_loss=0.163, train_accuracy=0.889, val_loss=0.383, val_accuracy=0.854]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.94it/s][A
Epoch 153:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.199, v_num=3, train_loss=

Epoch 153, global step 34803: val_loss was not in top 2


Epoch 154:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.172, v_num=3, train_loss=0.114, train_accuracy=0.944, val_loss=0.271, val_accuracy=0.886] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 154:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.172, v_num=3, train_loss=0.114, train_accuracy=0.944, val_loss=0.271, val_accuracy=0.886]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.35s/it][A
Epoch 154:  90%|█████████ | 230/255 [02:45<00:18,  1.39it/s, loss=0.172, v_num=3, train_loss=0.114, train_accuracy=0.944, val_loss=0.271, val_accuracy=0.886]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.76it/s][A
Epoch 154:  91%|█████████ | 232/255 [02:46<00:16,  1.40it/s, loss=0.172, v_num=3, train_loss=0.114, train_accuracy=0.944, val_loss=0.271, val_accuracy=0.886]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.89it/s][A
Epoch 154:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.172, v_num=3, train_loss=

Epoch 154, global step 35029: val_loss was not in top 2


Epoch 155:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.197, v_num=3, train_loss=0.110, train_accuracy=1.000, val_loss=0.263, val_accuracy=0.894] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 155:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.197, v_num=3, train_loss=0.110, train_accuracy=1.000, val_loss=0.263, val_accuracy=0.894]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.36s/it][A
Epoch 155:  90%|█████████ | 230/255 [02:46<00:18,  1.39it/s, loss=0.197, v_num=3, train_loss=0.110, train_accuracy=1.000, val_loss=0.263, val_accuracy=0.894]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.77it/s][A
Epoch 155:  91%|█████████ | 232/255 [02:46<00:16,  1.39it/s, loss=0.197, v_num=3, train_loss=0.110, train_accuracy=1.000, val_loss=0.263, val_accuracy=0.894]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.97it/s][A
Epoch 155:  92%|█████████▏| 234/255 [02:46<00:14,  1.40it/s, loss=0.197, v_num=3, train_loss=

Epoch 155, global step 35255: val_loss was not in top 2


Epoch 156:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.153, v_num=3, train_loss=0.169, train_accuracy=0.944, val_loss=0.261, val_accuracy=0.896] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 156:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.153, v_num=3, train_loss=0.169, train_accuracy=0.944, val_loss=0.261, val_accuracy=0.896]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 156:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.153, v_num=3, train_loss=0.169, train_accuracy=0.944, val_loss=0.261, val_accuracy=0.896]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.74it/s][A
Epoch 156:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.153, v_num=3, train_loss=0.169, train_accuracy=0.944, val_loss=0.261, val_accuracy=0.896]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.91it/s][A
Epoch 156:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.153, v_num=3, train_loss=

Epoch 156, global step 35481: val_loss was not in top 2


Epoch 157:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.26, v_num=3, train_loss=0.247, train_accuracy=0.944, val_loss=0.224, val_accuracy=0.917]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 157:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.26, v_num=3, train_loss=0.247, train_accuracy=0.944, val_loss=0.224, val_accuracy=0.917]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 157:  90%|█████████ | 230/255 [02:45<00:18,  1.39it/s, loss=0.26, v_num=3, train_loss=0.247, train_accuracy=0.944, val_loss=0.224, val_accuracy=0.917]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.76it/s][A
Epoch 157:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.26, v_num=3, train_loss=0.247, train_accuracy=0.944, val_loss=0.224, val_accuracy=0.917]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.88it/s][A
Epoch 157:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.26, v_num=3, train_loss=0.24

Epoch 157, global step 35707: val_loss was not in top 2


Epoch 158:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.156, v_num=3, train_loss=0.0688, train_accuracy=1.000, val_loss=0.299, val_accuracy=0.877]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 158:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.156, v_num=3, train_loss=0.0688, train_accuracy=1.000, val_loss=0.299, val_accuracy=0.877]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.33s/it][A
Epoch 158:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.156, v_num=3, train_loss=0.0688, train_accuracy=1.000, val_loss=0.299, val_accuracy=0.877]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.79it/s][A
Epoch 158:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.156, v_num=3, train_loss=0.0688, train_accuracy=1.000, val_loss=0.299, val_accuracy=0.877]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.93it/s][A
Epoch 158:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.156, v_num=3, train_lo

Epoch 158, global step 35933: val_loss was not in top 2


Epoch 159:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.137, v_num=3, train_loss=0.0736, train_accuracy=1.000, val_loss=0.208, val_accuracy=0.925]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 159:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.137, v_num=3, train_loss=0.0736, train_accuracy=1.000, val_loss=0.208, val_accuracy=0.925]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.35s/it][A
Epoch 159:  90%|█████████ | 230/255 [02:45<00:18,  1.39it/s, loss=0.137, v_num=3, train_loss=0.0736, train_accuracy=1.000, val_loss=0.208, val_accuracy=0.925]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.76it/s][A
Epoch 159:  91%|█████████ | 232/255 [02:46<00:16,  1.40it/s, loss=0.137, v_num=3, train_loss=0.0736, train_accuracy=1.000, val_loss=0.208, val_accuracy=0.925]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.87it/s][A
Epoch 159:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.137, v_num=3, train_lo

Epoch 159, global step 36159: val_loss was not in top 2


Epoch 160:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.12, v_num=3, train_loss=0.0141, train_accuracy=1.000, val_loss=0.204, val_accuracy=0.923] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 160:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.12, v_num=3, train_loss=0.0141, train_accuracy=1.000, val_loss=0.204, val_accuracy=0.923]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.36s/it][A
Epoch 160:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.12, v_num=3, train_loss=0.0141, train_accuracy=1.000, val_loss=0.204, val_accuracy=0.923]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.75it/s][A
Epoch 160:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.12, v_num=3, train_loss=0.0141, train_accuracy=1.000, val_loss=0.204, val_accuracy=0.923]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.88it/s][A
Epoch 160:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.12, v_num=3, train_loss=0

Epoch 160, global step 36385: val_loss was not in top 2


Epoch 161:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.204, v_num=3, train_loss=0.439, train_accuracy=0.778, val_loss=0.228, val_accuracy=0.921] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 161:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.204, v_num=3, train_loss=0.439, train_accuracy=0.778, val_loss=0.228, val_accuracy=0.921]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 161:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.204, v_num=3, train_loss=0.439, train_accuracy=0.778, val_loss=0.228, val_accuracy=0.921]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.77it/s][A
Epoch 161:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.204, v_num=3, train_loss=0.439, train_accuracy=0.778, val_loss=0.228, val_accuracy=0.921]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.89it/s][A
Epoch 161:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.204, v_num=3, train_loss=

Epoch 161, global step 36611: val_loss was not in top 2


Epoch 162:  89%|████████▊ | 226/255 [02:42<00:20,  1.40it/s, loss=0.255, v_num=3, train_loss=0.150, train_accuracy=0.944, val_loss=0.212, val_accuracy=0.916] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 162:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.255, v_num=3, train_loss=0.150, train_accuracy=0.944, val_loss=0.212, val_accuracy=0.916]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.35s/it][A
Epoch 162:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.255, v_num=3, train_loss=0.150, train_accuracy=0.944, val_loss=0.212, val_accuracy=0.916]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.77it/s][A
Epoch 162:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.255, v_num=3, train_loss=0.150, train_accuracy=0.944, val_loss=0.212, val_accuracy=0.916]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.93it/s][A
Epoch 162:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.255, v_num=3, train_loss=

Epoch 162, global step 36837: val_loss was not in top 2


Epoch 163:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.211, v_num=3, train_loss=0.146, train_accuracy=0.944, val_loss=0.302, val_accuracy=0.872] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 163:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.211, v_num=3, train_loss=0.146, train_accuracy=0.944, val_loss=0.302, val_accuracy=0.872]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 163:  90%|█████████ | 230/255 [02:45<00:18,  1.39it/s, loss=0.211, v_num=3, train_loss=0.146, train_accuracy=0.944, val_loss=0.302, val_accuracy=0.872]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.74it/s][A
Epoch 163:  91%|█████████ | 232/255 [02:46<00:16,  1.40it/s, loss=0.211, v_num=3, train_loss=0.146, train_accuracy=0.944, val_loss=0.302, val_accuracy=0.872]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.87it/s][A
Epoch 163:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.211, v_num=3, train_loss=

Epoch 163, global step 37063: val_loss was not in top 2


Epoch 164:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.139, v_num=3, train_loss=0.0552, train_accuracy=1.000, val_loss=0.239, val_accuracy=0.901]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 164:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.139, v_num=3, train_loss=0.0552, train_accuracy=1.000, val_loss=0.239, val_accuracy=0.901]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.36s/it][A
Epoch 164:  90%|█████████ | 230/255 [02:45<00:18,  1.39it/s, loss=0.139, v_num=3, train_loss=0.0552, train_accuracy=1.000, val_loss=0.239, val_accuracy=0.901]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.73it/s][A
Epoch 164:  91%|█████████ | 232/255 [02:46<00:16,  1.40it/s, loss=0.139, v_num=3, train_loss=0.0552, train_accuracy=1.000, val_loss=0.239, val_accuracy=0.901]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.81it/s][A
Epoch 164:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.139, v_num=3, train_lo

Epoch 164, global step 37289: val_loss was not in top 2


Epoch 165:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.143, v_num=3, train_loss=0.115, train_accuracy=0.944, val_loss=0.222, val_accuracy=0.920] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 165:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.143, v_num=3, train_loss=0.115, train_accuracy=0.944, val_loss=0.222, val_accuracy=0.920]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.36s/it][A
Epoch 165:  90%|█████████ | 230/255 [02:45<00:18,  1.39it/s, loss=0.143, v_num=3, train_loss=0.115, train_accuracy=0.944, val_loss=0.222, val_accuracy=0.920]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.75it/s][A
Epoch 165:  91%|█████████ | 232/255 [02:46<00:16,  1.40it/s, loss=0.143, v_num=3, train_loss=0.115, train_accuracy=0.944, val_loss=0.222, val_accuracy=0.920]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.90it/s][A
Epoch 165:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.143, v_num=3, train_loss=

Epoch 165, global step 37515: val_loss was not in top 2


Epoch 166:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.151, v_num=3, train_loss=0.0497, train_accuracy=1.000, val_loss=0.216, val_accuracy=0.923]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 166:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.151, v_num=3, train_loss=0.0497, train_accuracy=1.000, val_loss=0.216, val_accuracy=0.923]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 166:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.151, v_num=3, train_loss=0.0497, train_accuracy=1.000, val_loss=0.216, val_accuracy=0.923]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.76it/s][A
Epoch 166:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.151, v_num=3, train_loss=0.0497, train_accuracy=1.000, val_loss=0.216, val_accuracy=0.923]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.88it/s][A
Epoch 166:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.151, v_num=3, train_lo

Epoch 166, global step 37741: val_loss was not in top 2


Epoch 167:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.63, v_num=3, train_loss=0.550, train_accuracy=0.722, val_loss=0.225, val_accuracy=0.913]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 167:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.63, v_num=3, train_loss=0.550, train_accuracy=0.722, val_loss=0.225, val_accuracy=0.913]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.35s/it][A
Epoch 167:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.63, v_num=3, train_loss=0.550, train_accuracy=0.722, val_loss=0.225, val_accuracy=0.913]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.78it/s][A
Epoch 167:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.63, v_num=3, train_loss=0.550, train_accuracy=0.722, val_loss=0.225, val_accuracy=0.913]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.90it/s][A
Epoch 167:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.63, v_num=3, train_loss=0.55

Epoch 167, global step 37967: val_loss was not in top 2


Epoch 168:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.488, v_num=3, train_loss=0.536, train_accuracy=0.611, val_loss=0.652, val_accuracy=0.634]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 168:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.488, v_num=3, train_loss=0.536, train_accuracy=0.611, val_loss=0.652, val_accuracy=0.634]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.35s/it][A
Epoch 168:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.488, v_num=3, train_loss=0.536, train_accuracy=0.611, val_loss=0.652, val_accuracy=0.634]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.75it/s][A
Epoch 168:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.488, v_num=3, train_loss=0.536, train_accuracy=0.611, val_loss=0.652, val_accuracy=0.634]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.89it/s][A
Epoch 168:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.488, v_num=3, train_loss=0

Epoch 168, global step 38193: val_loss was not in top 2


Epoch 169:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.459, v_num=3, train_loss=0.480, train_accuracy=0.722, val_loss=0.519, val_accuracy=0.756]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 169:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.459, v_num=3, train_loss=0.480, train_accuracy=0.722, val_loss=0.519, val_accuracy=0.756]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.36s/it][A
Epoch 169:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.459, v_num=3, train_loss=0.480, train_accuracy=0.722, val_loss=0.519, val_accuracy=0.756]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.73it/s][A
Epoch 169:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.459, v_num=3, train_loss=0.480, train_accuracy=0.722, val_loss=0.519, val_accuracy=0.756]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.89it/s][A
Epoch 169:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.459, v_num=3, train_loss=0

Epoch 169, global step 38419: val_loss was not in top 2


Epoch 170:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.421, v_num=3, train_loss=0.384, train_accuracy=0.833, val_loss=0.500, val_accuracy=0.761]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 170:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.421, v_num=3, train_loss=0.384, train_accuracy=0.833, val_loss=0.500, val_accuracy=0.761]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.35s/it][A
Epoch 170:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.421, v_num=3, train_loss=0.384, train_accuracy=0.833, val_loss=0.500, val_accuracy=0.761]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.75it/s][A
Epoch 170:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.421, v_num=3, train_loss=0.384, train_accuracy=0.833, val_loss=0.500, val_accuracy=0.761]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.90it/s][A
Epoch 170:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.421, v_num=3, train_loss=0

Epoch 170, global step 38645: val_loss was not in top 2


Epoch 171:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.29, v_num=3, train_loss=0.302, train_accuracy=0.889, val_loss=0.424, val_accuracy=0.825] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 171:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.29, v_num=3, train_loss=0.302, train_accuracy=0.889, val_loss=0.424, val_accuracy=0.825]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 171:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.29, v_num=3, train_loss=0.302, train_accuracy=0.889, val_loss=0.424, val_accuracy=0.825]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.79it/s][A
Epoch 171:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.29, v_num=3, train_loss=0.302, train_accuracy=0.889, val_loss=0.424, val_accuracy=0.825]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.89it/s][A
Epoch 171:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.29, v_num=3, train_loss=0.302

Epoch 171, global step 38871: val_loss was not in top 2


Epoch 172:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.269, v_num=3, train_loss=0.280, train_accuracy=0.944, val_loss=0.353, val_accuracy=0.854]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 172:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.269, v_num=3, train_loss=0.280, train_accuracy=0.944, val_loss=0.353, val_accuracy=0.854]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.36s/it][A
Epoch 172:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.269, v_num=3, train_loss=0.280, train_accuracy=0.944, val_loss=0.353, val_accuracy=0.854]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.73it/s][A
Epoch 172:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.269, v_num=3, train_loss=0.280, train_accuracy=0.944, val_loss=0.353, val_accuracy=0.854]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.87it/s][A
Epoch 172:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.269, v_num=3, train_loss=0

Epoch 172, global step 39097: val_loss was not in top 2


Epoch 173:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.241, v_num=3, train_loss=0.279, train_accuracy=0.889, val_loss=0.324, val_accuracy=0.872]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 173:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.241, v_num=3, train_loss=0.279, train_accuracy=0.889, val_loss=0.324, val_accuracy=0.872]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 173:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.241, v_num=3, train_loss=0.279, train_accuracy=0.889, val_loss=0.324, val_accuracy=0.872]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.78it/s][A
Epoch 173:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.241, v_num=3, train_loss=0.279, train_accuracy=0.889, val_loss=0.324, val_accuracy=0.872]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.87it/s][A
Epoch 173:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.241, v_num=3, train_loss=0

Epoch 173, global step 39323: val_loss was not in top 2


Epoch 174:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.226, v_num=3, train_loss=0.249, train_accuracy=0.889, val_loss=0.279, val_accuracy=0.892] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 174:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.226, v_num=3, train_loss=0.249, train_accuracy=0.889, val_loss=0.279, val_accuracy=0.892]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.33s/it][A
Epoch 174:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.226, v_num=3, train_loss=0.249, train_accuracy=0.889, val_loss=0.279, val_accuracy=0.892]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.78it/s][A
Epoch 174:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.226, v_num=3, train_loss=0.249, train_accuracy=0.889, val_loss=0.279, val_accuracy=0.892]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.86it/s][A
Epoch 174:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.226, v_num=3, train_loss=

Epoch 174, global step 39549: val_loss was not in top 2


Epoch 175:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.199, v_num=3, train_loss=0.101, train_accuracy=0.944, val_loss=0.281, val_accuracy=0.892]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 175:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.199, v_num=3, train_loss=0.101, train_accuracy=0.944, val_loss=0.281, val_accuracy=0.892]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 175:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.199, v_num=3, train_loss=0.101, train_accuracy=0.944, val_loss=0.281, val_accuracy=0.892]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.75it/s][A
Epoch 175:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.199, v_num=3, train_loss=0.101, train_accuracy=0.944, val_loss=0.281, val_accuracy=0.892]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.85it/s][A
Epoch 175:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.199, v_num=3, train_loss=0

Epoch 175, global step 39775: val_loss was not in top 2


Epoch 176:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.182, v_num=3, train_loss=0.131, train_accuracy=0.944, val_loss=0.264, val_accuracy=0.891] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 176:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.182, v_num=3, train_loss=0.131, train_accuracy=0.944, val_loss=0.264, val_accuracy=0.891]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.35s/it][A
Epoch 176:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.182, v_num=3, train_loss=0.131, train_accuracy=0.944, val_loss=0.264, val_accuracy=0.891]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.76it/s][A
Epoch 176:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.182, v_num=3, train_loss=0.131, train_accuracy=0.944, val_loss=0.264, val_accuracy=0.891]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.86it/s][A
Epoch 176:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.182, v_num=3, train_loss=

Epoch 176, global step 40001: val_loss was not in top 2


Epoch 177:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.165, v_num=3, train_loss=0.201, train_accuracy=0.889, val_loss=0.263, val_accuracy=0.898] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 177:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.165, v_num=3, train_loss=0.201, train_accuracy=0.889, val_loss=0.263, val_accuracy=0.898]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 177:  90%|█████████ | 230/255 [02:45<00:18,  1.39it/s, loss=0.165, v_num=3, train_loss=0.201, train_accuracy=0.889, val_loss=0.263, val_accuracy=0.898]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.74it/s][A
Epoch 177:  91%|█████████ | 232/255 [02:46<00:16,  1.40it/s, loss=0.165, v_num=3, train_loss=0.201, train_accuracy=0.889, val_loss=0.263, val_accuracy=0.898]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.79it/s][A
Epoch 177:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.165, v_num=3, train_loss=

Epoch 177, global step 40227: val_loss was not in top 2


Epoch 178:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.157, v_num=3, train_loss=0.0525, train_accuracy=1.000, val_loss=0.234, val_accuracy=0.903]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 178:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.157, v_num=3, train_loss=0.0525, train_accuracy=1.000, val_loss=0.234, val_accuracy=0.903]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 178:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.157, v_num=3, train_loss=0.0525, train_accuracy=1.000, val_loss=0.234, val_accuracy=0.903]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.75it/s][A
Epoch 178:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.157, v_num=3, train_loss=0.0525, train_accuracy=1.000, val_loss=0.234, val_accuracy=0.903]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.91it/s][A
Epoch 178:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.157, v_num=3, train_lo

Epoch 178, global step 40453: val_loss was not in top 2


Epoch 179:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.167, v_num=3, train_loss=0.0725, train_accuracy=1.000, val_loss=0.226, val_accuracy=0.902]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 179:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.167, v_num=3, train_loss=0.0725, train_accuracy=1.000, val_loss=0.226, val_accuracy=0.902]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.35s/it][A
Epoch 179:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.167, v_num=3, train_loss=0.0725, train_accuracy=1.000, val_loss=0.226, val_accuracy=0.902]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.76it/s][A
Epoch 179:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.167, v_num=3, train_loss=0.0725, train_accuracy=1.000, val_loss=0.226, val_accuracy=0.902]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.89it/s][A
Epoch 179:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.167, v_num=3, train_lo

Epoch 179, global step 40679: val_loss was not in top 2


Epoch 180:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.162, v_num=3, train_loss=0.183, train_accuracy=0.889, val_loss=0.232, val_accuracy=0.906] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 180:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.162, v_num=3, train_loss=0.183, train_accuracy=0.889, val_loss=0.232, val_accuracy=0.906]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.33s/it][A
Epoch 180:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.162, v_num=3, train_loss=0.183, train_accuracy=0.889, val_loss=0.232, val_accuracy=0.906]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.75it/s][A
Epoch 180:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.162, v_num=3, train_loss=0.183, train_accuracy=0.889, val_loss=0.232, val_accuracy=0.906]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.87it/s][A
Epoch 180:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.162, v_num=3, train_loss=

Epoch 180, global step 40905: val_loss was not in top 2


Epoch 181:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.138, v_num=3, train_loss=0.0402, train_accuracy=1.000, val_loss=0.211, val_accuracy=0.916]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 181:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.138, v_num=3, train_loss=0.0402, train_accuracy=1.000, val_loss=0.211, val_accuracy=0.916]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.33s/it][A
Epoch 181:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.138, v_num=3, train_loss=0.0402, train_accuracy=1.000, val_loss=0.211, val_accuracy=0.916]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.78it/s][A
Epoch 181:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.138, v_num=3, train_loss=0.0402, train_accuracy=1.000, val_loss=0.211, val_accuracy=0.916]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.84it/s][A
Epoch 181:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.138, v_num=3, train_lo

Epoch 181, global step 41131: val_loss was not in top 2


Epoch 182:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.103, v_num=3, train_loss=0.106, train_accuracy=0.944, val_loss=0.209, val_accuracy=0.915] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 182:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.103, v_num=3, train_loss=0.106, train_accuracy=0.944, val_loss=0.209, val_accuracy=0.915]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 182:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.103, v_num=3, train_loss=0.106, train_accuracy=0.944, val_loss=0.209, val_accuracy=0.915]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.77it/s][A
Epoch 182:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.103, v_num=3, train_loss=0.106, train_accuracy=0.944, val_loss=0.209, val_accuracy=0.915]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.90it/s][A
Epoch 182:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.103, v_num=3, train_loss=

Epoch 182, global step 41357: val_loss was not in top 2


Epoch 183:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.11, v_num=3, train_loss=0.134, train_accuracy=0.944, val_loss=0.206, val_accuracy=0.928]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 183:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.11, v_num=3, train_loss=0.134, train_accuracy=0.944, val_loss=0.206, val_accuracy=0.928]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 183:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.11, v_num=3, train_loss=0.134, train_accuracy=0.944, val_loss=0.206, val_accuracy=0.928]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.78it/s][A
Epoch 183:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.11, v_num=3, train_loss=0.134, train_accuracy=0.944, val_loss=0.206, val_accuracy=0.928]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.88it/s][A
Epoch 183:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.11, v_num=3, train_loss=0.13

Epoch 183, global step 41583: val_loss was not in top 2


Epoch 184:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.111, v_num=3, train_loss=0.0233, train_accuracy=1.000, val_loss=0.199, val_accuracy=0.926]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 184:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.111, v_num=3, train_loss=0.0233, train_accuracy=1.000, val_loss=0.199, val_accuracy=0.926]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 184:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.111, v_num=3, train_loss=0.0233, train_accuracy=1.000, val_loss=0.199, val_accuracy=0.926]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.76it/s][A
Epoch 184:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.111, v_num=3, train_loss=0.0233, train_accuracy=1.000, val_loss=0.199, val_accuracy=0.926]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.92it/s][A
Epoch 184:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.111, v_num=3, train_lo

Epoch 184, global step 41809: val_loss was not in top 2


Epoch 185:  89%|████████▊ | 226/255 [02:42<00:20,  1.40it/s, loss=0.124, v_num=3, train_loss=0.212, train_accuracy=0.889, val_loss=0.215, val_accuracy=0.924]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 185:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.124, v_num=3, train_loss=0.212, train_accuracy=0.889, val_loss=0.215, val_accuracy=0.924]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 185:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.124, v_num=3, train_loss=0.212, train_accuracy=0.889, val_loss=0.215, val_accuracy=0.924]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.77it/s][A
Epoch 185:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.124, v_num=3, train_loss=0.212, train_accuracy=0.889, val_loss=0.215, val_accuracy=0.924]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.91it/s][A
Epoch 185:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.124, v_num=3, train_loss

Epoch 185, global step 42035: val_loss was not in top 2


Epoch 186:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.113, v_num=3, train_loss=0.0795, train_accuracy=1.000, val_loss=0.240, val_accuracy=0.906] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 186:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.113, v_num=3, train_loss=0.0795, train_accuracy=1.000, val_loss=0.240, val_accuracy=0.906]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.35s/it][A
Epoch 186:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.113, v_num=3, train_loss=0.0795, train_accuracy=1.000, val_loss=0.240, val_accuracy=0.906]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.76it/s][A
Epoch 186:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.113, v_num=3, train_loss=0.0795, train_accuracy=1.000, val_loss=0.240, val_accuracy=0.906]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.85it/s][A
Epoch 186:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.113, v_num=3, train_l

Epoch 186, global step 42261: val_loss was not in top 2


Epoch 187:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.0931, v_num=3, train_loss=0.0308, train_accuracy=1.000, val_loss=0.201, val_accuracy=0.925]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 187:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.0931, v_num=3, train_loss=0.0308, train_accuracy=1.000, val_loss=0.201, val_accuracy=0.925]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.35s/it][A
Epoch 187:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.0931, v_num=3, train_loss=0.0308, train_accuracy=1.000, val_loss=0.201, val_accuracy=0.925]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.77it/s][A
Epoch 187:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.0931, v_num=3, train_loss=0.0308, train_accuracy=1.000, val_loss=0.201, val_accuracy=0.925]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.88it/s][A
Epoch 187:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.0931, v_num=3, tra

Epoch 187, global step 42487: val_loss was not in top 2


Epoch 188:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.126, v_num=3, train_loss=0.246, train_accuracy=0.944, val_loss=0.182, val_accuracy=0.929]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 188:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.126, v_num=3, train_loss=0.246, train_accuracy=0.944, val_loss=0.182, val_accuracy=0.929]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 188:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.126, v_num=3, train_loss=0.246, train_accuracy=0.944, val_loss=0.182, val_accuracy=0.929]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.76it/s][A
Epoch 188:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.126, v_num=3, train_loss=0.246, train_accuracy=0.944, val_loss=0.182, val_accuracy=0.929]
Validating:  21%|██        | 6/29 [00:03<00:08,  2.86it/s][A
Epoch 188:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.126, v_num=3, train_loss

Epoch 188, global step 42713: val_loss was not in top 2


Epoch 189:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.0958, v_num=3, train_loss=0.206, train_accuracy=0.889, val_loss=0.192, val_accuracy=0.925] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 189:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.0958, v_num=3, train_loss=0.206, train_accuracy=0.889, val_loss=0.192, val_accuracy=0.925]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.35s/it][A
Epoch 189:  90%|█████████ | 230/255 [02:45<00:18,  1.39it/s, loss=0.0958, v_num=3, train_loss=0.206, train_accuracy=0.889, val_loss=0.192, val_accuracy=0.925]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.75it/s][A
Epoch 189:  91%|█████████ | 232/255 [02:46<00:16,  1.40it/s, loss=0.0958, v_num=3, train_loss=0.206, train_accuracy=0.889, val_loss=0.192, val_accuracy=0.925]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.88it/s][A
Epoch 189:  92%|█████████▏| 234/255 [02:46<00:14,  1.40it/s, loss=0.0958, v_num=3, train_

Epoch 189, global step 42939: val_loss was not in top 2


Epoch 190:  87%|████████▋ | 221/255 [02:38<00:24,  1.39it/s, loss=0.0823, v_num=3, train_loss=0.0629, train_accuracy=0.960, val_loss=0.216, val_accuracy=0.929]

IOPub message rate exceeded.
The notebook server will temporarily stop sending output
to the client in order to avoid crashing it.
To change this limit, set the config variable
`--NotebookApp.iopub_msg_rate_limit`.

Current values:
NotebookApp.iopub_msg_rate_limit=1000.0 (msgs/sec)
NotebookApp.rate_limit_window=3.0 (secs)



Epoch 194:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.102, v_num=3, train_loss=0.0429, train_accuracy=1.000, val_loss=0.198, val_accuracy=0.921] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 194:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.102, v_num=3, train_loss=0.0429, train_accuracy=1.000, val_loss=0.198, val_accuracy=0.921]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 194:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.102, v_num=3, train_loss=0.0429, train_accuracy=1.000, val_loss=0.198, val_accuracy=0.921]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.78it/s][A
Epoch 194:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.102, v_num=3, train_loss=0.0429, train_accuracy=1.000, val_loss=0.198, val_accuracy=0.921]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.97it/s][A
Epoch 194:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.102, v_num=3, train_l

Epoch 194, global step 44069: val_loss was not in top 2


Epoch 195:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.107, v_num=3, train_loss=0.108, train_accuracy=0.944, val_loss=0.203, val_accuracy=0.922]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 195:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.107, v_num=3, train_loss=0.108, train_accuracy=0.944, val_loss=0.203, val_accuracy=0.922]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.27s/it][A
Epoch 195:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.107, v_num=3, train_loss=0.108, train_accuracy=0.944, val_loss=0.203, val_accuracy=0.922]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.85it/s][A
Epoch 195:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.107, v_num=3, train_loss=0.108, train_accuracy=0.944, val_loss=0.203, val_accuracy=0.922]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.01it/s][A
Epoch 195:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.107, v_num=3, train_loss

Epoch 195, global step 44295: val_loss was not in top 2


Epoch 196:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.139, v_num=3, train_loss=0.0801, train_accuracy=0.944, val_loss=0.198, val_accuracy=0.924] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 196:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.139, v_num=3, train_loss=0.0801, train_accuracy=0.944, val_loss=0.198, val_accuracy=0.924]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.31s/it][A
Epoch 196:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.139, v_num=3, train_loss=0.0801, train_accuracy=0.944, val_loss=0.198, val_accuracy=0.924]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.80it/s][A
Epoch 196:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.139, v_num=3, train_loss=0.0801, train_accuracy=0.944, val_loss=0.198, val_accuracy=0.924]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.92it/s][A
Epoch 196:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.139, v_num=3, train_l

Epoch 196, global step 44521: val_loss was not in top 2


Epoch 197:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.145, v_num=3, train_loss=0.161, train_accuracy=0.889, val_loss=0.221, val_accuracy=0.923]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 197:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.145, v_num=3, train_loss=0.161, train_accuracy=0.889, val_loss=0.221, val_accuracy=0.923]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.33s/it][A
Epoch 197:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.145, v_num=3, train_loss=0.161, train_accuracy=0.889, val_loss=0.221, val_accuracy=0.923]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.79it/s][A
Epoch 197:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.145, v_num=3, train_loss=0.161, train_accuracy=0.889, val_loss=0.221, val_accuracy=0.923]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.89it/s][A
Epoch 197:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.145, v_num=3, train_loss

Epoch 197, global step 44747: val_loss was not in top 2


Epoch 198:  89%|████████▊ | 226/255 [02:41<00:20,  1.40it/s, loss=0.113, v_num=3, train_loss=0.0364, train_accuracy=1.000, val_loss=0.227, val_accuracy=0.918]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 198:  89%|████████▉ | 228/255 [02:44<00:19,  1.38it/s, loss=0.113, v_num=3, train_loss=0.0364, train_accuracy=1.000, val_loss=0.227, val_accuracy=0.918]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 198:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.113, v_num=3, train_loss=0.0364, train_accuracy=1.000, val_loss=0.227, val_accuracy=0.918]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.76it/s][A
Epoch 198:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.113, v_num=3, train_loss=0.0364, train_accuracy=1.000, val_loss=0.227, val_accuracy=0.918]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.91it/s][A
Epoch 198:  92%|█████████▏| 234/255 [02:45<00:14,  1.41it/s, loss=0.113, v_num=3, train_lo

Epoch 198, global step 44973: val_loss was not in top 2


Epoch 199:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.113, v_num=3, train_loss=0.0147, train_accuracy=1.000, val_loss=0.216, val_accuracy=0.917]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 199:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.113, v_num=3, train_loss=0.0147, train_accuracy=1.000, val_loss=0.216, val_accuracy=0.917]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.31s/it][A
Epoch 199:  90%|█████████ | 230/255 [02:45<00:17,  1.39it/s, loss=0.113, v_num=3, train_loss=0.0147, train_accuracy=1.000, val_loss=0.216, val_accuracy=0.917]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.80it/s][A
Epoch 199:  91%|█████████ | 232/255 [02:45<00:16,  1.40it/s, loss=0.113, v_num=3, train_loss=0.0147, train_accuracy=1.000, val_loss=0.216, val_accuracy=0.917]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.89it/s][A
Epoch 199:  92%|█████████▏| 234/255 [02:46<00:14,  1.41it/s, loss=0.113, v_num=3, train_lo

Epoch 199, global step 45199: val_loss was not in top 2


Epoch 199: 100%|██████████| 255/255 [02:50<00:00,  1.49it/s, loss=0.113, v_num=3, train_loss=0.0147, train_accuracy=1.000, val_loss=0.197, val_accuracy=0.921]


LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1,2]


Testing: 100%|██████████| 29/29 [00:08<00:00,  3.15it/s]--------------------------------------------------------------------------------
DATALOADER:0 TEST RESULTS
{'test_accuracy': 0.9339957237243652, 'test_loss': 0.16499805450439453}
--------------------------------------------------------------------------------
Testing: 100%|██████████| 29/29 [00:08<00:00,  3.44it/s]
------------------ Round: 29 ------------------
['FT9', 'F8', 'OZ', 'CZ', 'FC4', 'FC3', 'FP1', 'PO1', 'T3', 'T4', 'PO2']
Len: 11


GPU available: True, used: True
TPU available: False, using: 0 TPU cores
IPU available: False, using: 0 IPUs
LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1,2]

  | Name      | Type             | Params
-----------------------------------------------
0 | model     | DrowsyModel      | 1.3 M 
1 | criterion | CrossEntropyLoss | 0     
-----------------------------------------------
1.3 M     Trainable params
0         Non-trainable params
1.3 M     Total params
5.315     Total estimated model params size (MB)
  rank_zero_warn(f"Checkpoint directory {dirpath} exists and is not empty.")


                                                                      

Global seed set to 42


Epoch 0:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.665, v_num=3, train_loss=0.694, train_accuracy=0.611]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 0:  89%|████████▉ | 228/255 [02:45<00:19,  1.37it/s, loss=0.665, v_num=3, train_loss=0.694, train_accuracy=0.611]
Validating:   7%|▋         | 2/29 [00:03<00:41,  1.53s/it][A
Epoch 0:  90%|█████████ | 230/255 [02:46<00:18,  1.38it/s, loss=0.665, v_num=3, train_loss=0.694, train_accuracy=0.611]
Validating:  14%|█▍        | 4/29 [00:04<00:15,  1.58it/s][A
Epoch 0:  91%|█████████ | 232/255 [02:46<00:16,  1.39it/s, loss=0.665, v_num=3, train_loss=0.694, train_accuracy=0.611]
Validating:  21%|██        | 6/29 [00:04<00:08,  2.67it/s][A
Epoch 0:  92%|█████████▏| 234/255 [02:46<00:14,  1.40it/s, loss=0.665, v_num=3, train_loss=0.694, train_accuracy=0.611]
Validating:  28%|██▊       | 8/29 [00:04<00:05,  3.76it/s][A
Epoch 0:  93%|█████████▎| 236/255 [02:47<00:13,  1.41it/s, loss=

Epoch 0, global step 225: val_loss reached 0.67346 (best 0.67346), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-29.ckpt" as top 2


Epoch 1:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.6, v_num=3, train_loss=0.653, train_accuracy=0.611, val_loss=0.673, val_accuracy=0.580]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 1:  89%|████████▉ | 228/255 [02:46<00:19,  1.37it/s, loss=0.6, v_num=3, train_loss=0.653, train_accuracy=0.611, val_loss=0.673, val_accuracy=0.580]
Validating:   7%|▋         | 2/29 [00:03<00:41,  1.55s/it][A
Epoch 1:  90%|█████████ | 230/255 [02:46<00:18,  1.38it/s, loss=0.6, v_num=3, train_loss=0.653, train_accuracy=0.611, val_loss=0.673, val_accuracy=0.580]
Validating:  14%|█▍        | 4/29 [00:04<00:16,  1.55it/s][A
Epoch 1:  91%|█████████ | 232/255 [02:46<00:16,  1.39it/s, loss=0.6, v_num=3, train_loss=0.653, train_accuracy=0.611, val_loss=0.673, val_accuracy=0.580]
Validating:  21%|██        | 6/29 [00:04<00:08,  2.61it/s][A
Epoch 1:  92%|█████████▏| 234/255 [02:47<00:15,  1.40it/s, loss=0.6, v_num=3, train_loss=0.653, train_accura

Epoch 1, global step 451: val_loss reached 0.58750 (best 0.58750), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-29-v1.ckpt" as top 2


Epoch 2:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.573, v_num=3, train_loss=0.696, train_accuracy=0.611, val_loss=0.588, val_accuracy=0.720]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 2:  89%|████████▉ | 228/255 [02:45<00:19,  1.37it/s, loss=0.573, v_num=3, train_loss=0.696, train_accuracy=0.611, val_loss=0.588, val_accuracy=0.720]
Validating:   7%|▋         | 2/29 [00:03<00:41,  1.55s/it][A
Epoch 2:  90%|█████████ | 230/255 [02:46<00:18,  1.38it/s, loss=0.573, v_num=3, train_loss=0.696, train_accuracy=0.611, val_loss=0.588, val_accuracy=0.720]
Validating:  14%|█▍        | 4/29 [00:04<00:15,  1.59it/s][A
Epoch 2:  91%|█████████ | 232/255 [02:46<00:16,  1.39it/s, loss=0.573, v_num=3, train_loss=0.696, train_accuracy=0.611, val_loss=0.588, val_accuracy=0.720]
Validating:  21%|██        | 6/29 [00:04<00:08,  2.64it/s][A
Epoch 2:  92%|█████████▏| 234/255 [02:47<00:14,  1.40it/s, loss=0.573, v_num=3, train_loss=0.696, trai

Epoch 2, global step 677: val_loss reached 0.58456 (best 0.58456), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-29.ckpt" as top 2


Epoch 3:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.523, v_num=3, train_loss=0.410, train_accuracy=0.778, val_loss=0.585, val_accuracy=0.715]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 3:  89%|████████▉ | 228/255 [02:45<00:19,  1.38it/s, loss=0.523, v_num=3, train_loss=0.410, train_accuracy=0.778, val_loss=0.585, val_accuracy=0.715]
Validating:   7%|▋         | 2/29 [00:03<00:42,  1.56s/it][A
Epoch 3:  90%|█████████ | 230/255 [02:46<00:18,  1.38it/s, loss=0.523, v_num=3, train_loss=0.410, train_accuracy=0.778, val_loss=0.585, val_accuracy=0.715]
Validating:  14%|█▍        | 4/29 [00:04<00:15,  1.58it/s][A
Epoch 3:  91%|█████████ | 232/255 [02:46<00:16,  1.39it/s, loss=0.523, v_num=3, train_loss=0.410, train_accuracy=0.778, val_loss=0.585, val_accuracy=0.715]
Validating:  21%|██        | 6/29 [00:04<00:08,  2.64it/s][A
Epoch 3:  92%|█████████▏| 234/255 [02:46<00:14,  1.40it/s, loss=0.523, v_num=3, train_loss=0.410, trai

Epoch 3, global step 903: val_loss was not in top 2


Epoch 4:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.551, v_num=3, train_loss=0.484, train_accuracy=0.778, val_loss=0.589, val_accuracy=0.732]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 4:  89%|████████▉ | 228/255 [02:46<00:19,  1.37it/s, loss=0.551, v_num=3, train_loss=0.484, train_accuracy=0.778, val_loss=0.589, val_accuracy=0.732]
Validating:   7%|▋         | 2/29 [00:03<00:41,  1.55s/it][A
Epoch 4:  90%|█████████ | 230/255 [02:46<00:18,  1.38it/s, loss=0.551, v_num=3, train_loss=0.484, train_accuracy=0.778, val_loss=0.589, val_accuracy=0.732]
Validating:  14%|█▍        | 4/29 [00:04<00:15,  1.59it/s][A
Epoch 4:  91%|█████████ | 232/255 [02:47<00:16,  1.39it/s, loss=0.551, v_num=3, train_loss=0.484, train_accuracy=0.778, val_loss=0.589, val_accuracy=0.732]
Validating:  21%|██        | 6/29 [00:04<00:08,  2.65it/s][A
Epoch 4:  92%|█████████▏| 234/255 [02:47<00:15,  1.40it/s, loss=0.551, v_num=3, train_loss=0.484, trai

Epoch 4, global step 1129: val_loss was not in top 2


Epoch 5:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.583, v_num=3, train_loss=0.675, train_accuracy=0.611, val_loss=0.630, val_accuracy=0.688]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 5:  89%|████████▉ | 228/255 [02:46<00:19,  1.37it/s, loss=0.583, v_num=3, train_loss=0.675, train_accuracy=0.611, val_loss=0.630, val_accuracy=0.688]
Validating:   7%|▋         | 2/29 [00:03<00:43,  1.59s/it][A
Epoch 5:  90%|█████████ | 230/255 [02:46<00:18,  1.38it/s, loss=0.583, v_num=3, train_loss=0.675, train_accuracy=0.611, val_loss=0.630, val_accuracy=0.688]
Validating:  14%|█▍        | 4/29 [00:04<00:16,  1.56it/s][A
Epoch 5:  91%|█████████ | 232/255 [02:46<00:16,  1.39it/s, loss=0.583, v_num=3, train_loss=0.675, train_accuracy=0.611, val_loss=0.630, val_accuracy=0.688]
Validating:  21%|██        | 6/29 [00:04<00:08,  2.67it/s][A
Epoch 5:  92%|█████████▏| 234/255 [02:47<00:14,  1.40it/s, loss=0.583, v_num=3, train_loss=0.675, trai

Epoch 5, global step 1355: val_loss reached 0.58238 (best 0.58238), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-29-v1.ckpt" as top 2


Epoch 6:  89%|████████▊ | 226/255 [02:39<00:20,  1.42it/s, loss=0.503, v_num=3, train_loss=0.281, train_accuracy=0.889, val_loss=0.582, val_accuracy=0.700]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 6:  89%|████████▉ | 228/255 [02:43<00:19,  1.40it/s, loss=0.503, v_num=3, train_loss=0.281, train_accuracy=0.889, val_loss=0.582, val_accuracy=0.700]
Validating:   7%|▋         | 2/29 [00:03<00:42,  1.59s/it][A
Epoch 6:  90%|█████████ | 230/255 [02:43<00:17,  1.41it/s, loss=0.503, v_num=3, train_loss=0.281, train_accuracy=0.889, val_loss=0.582, val_accuracy=0.700]
Validating:  14%|█▍        | 4/29 [00:04<00:16,  1.55it/s][A
Epoch 6:  91%|█████████ | 232/255 [02:44<00:16,  1.41it/s, loss=0.503, v_num=3, train_loss=0.281, train_accuracy=0.889, val_loss=0.582, val_accuracy=0.700]
Validating:  21%|██        | 6/29 [00:04<00:08,  2.66it/s][A
Epoch 6:  92%|█████████▏| 234/255 [02:44<00:14,  1.42it/s, loss=0.503, v_num=3, train_loss=0.281, trai

Epoch 6, global step 1581: val_loss reached 0.57178 (best 0.57178), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-29.ckpt" as top 2


Epoch 7:  89%|████████▊ | 226/255 [02:42<00:20,  1.39it/s, loss=0.532, v_num=3, train_loss=0.459, train_accuracy=0.778, val_loss=0.572, val_accuracy=0.740]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 7:  89%|████████▉ | 228/255 [02:45<00:19,  1.37it/s, loss=0.532, v_num=3, train_loss=0.459, train_accuracy=0.778, val_loss=0.572, val_accuracy=0.740]
Validating:   7%|▋         | 2/29 [00:03<00:42,  1.58s/it][A
Epoch 7:  90%|█████████ | 230/255 [02:46<00:18,  1.38it/s, loss=0.532, v_num=3, train_loss=0.459, train_accuracy=0.778, val_loss=0.572, val_accuracy=0.740]
Validating:  14%|█▍        | 4/29 [00:04<00:16,  1.54it/s][A
Epoch 7:  91%|█████████ | 232/255 [02:46<00:16,  1.39it/s, loss=0.532, v_num=3, train_loss=0.459, train_accuracy=0.778, val_loss=0.572, val_accuracy=0.740]
Validating:  21%|██        | 6/29 [00:04<00:08,  2.61it/s][A
Epoch 7:  92%|█████████▏| 234/255 [02:47<00:14,  1.40it/s, loss=0.532, v_num=3, train_loss=0.459, trai

Epoch 7, global step 1807: val_loss was not in top 2


Epoch 8:  22%|██▏       | 57/255 [00:43<02:30,  1.31it/s, loss=0.527, v_num=3, train_loss=0.626, train_accuracy=0.640, val_loss=0.617, val_accuracy=0.733] 

## Load Checkpoint 

In [None]:
# best-checkpoint-corr-3-v1.ckptn
# trainer.fit(model, data_module, ckpt_path="/Workspace/code/checkpoints/best-checkpoint-corr-3-v1.ckpt")