In [1]:
import os
import pandas as pd
import numpy as np
from sklearn.preprocessing import LabelEncoder
from sklearn.model_selection import train_test_split
from sklearn.metrics import classification_report, confusion_matrix
import matplotlib.pyplot as plt

import torch
from torch import nn, optim
from torch.nn import functional as F
from torch.utils.data import Dataset, DataLoader

import torchmetrics
from torchmetrics.functional import accuracy

import pytorch_lightning as pl
from pytorch_lightning.loggers import TensorBoardLogger
from pytorch_lightning.callbacks import ModelCheckpoint

# Prefer the GPU when CUDA is available; otherwise fall back to the CPU.
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
print(device)

cuda


## Model Setup 

In [2]:
# Seed the random number generators through Lightning so runs are repeatable;
# workers=True also asks Lightning to seed DataLoader worker processes.
pl.seed_everything(42, workers=True)

class DrowsyDataset(Dataset):
    """Map-style dataset over a list of ``(features, label)`` pairs.

    Each ``features`` object must expose ``to_numpy()`` and each ``label``
    must be convertible with ``torch.tensor``.
    """

    def __init__(self, sequences):
        self.sequences = sequences

    def __len__(self):
        """Number of ``(features, label)`` pairs held by the dataset."""
        return len(self.sequences)

    def __getitem__(self, idx):
        """Return pair ``idx`` as a dict of ``sequence`` and ``label`` tensors."""
        frame, target = self.sequences[idx]
        features = torch.Tensor(frame.to_numpy())
        label = torch.tensor(target).long()
        return {"sequence": features, "label": label}
    
class DrowsyDataModule(pl.LightningDataModule):
    """Lightning data module serving the train / validation / test splits.

    Args:
        train_sequences: ``(features, label)`` pairs used for training.
        val_sequences: ``(features, label)`` pairs used for validation.
        test_sequences: ``(features, label)`` pairs used for testing.
        batch_size: number of sequences per batch for all three loaders.
        num_workers: number of DataLoader worker processes. ``None`` (the
            default) uses ``os.cpu_count()``, falling back to 0 (load in the
            main process) when the CPU count cannot be determined.
    """

    def __init__(self, train_sequences, val_sequences, test_sequences, batch_size,
                 num_workers=None):
        super().__init__()
        self.train_sequences = train_sequences
        self.val_sequences = val_sequences
        self.test_sequences = test_sequences
        self.batch_size = batch_size
        # os.cpu_count() may return None, which DataLoader does not accept.
        if num_workers is None:
            num_workers = os.cpu_count() or 0
        self.num_workers = num_workers

    def setup(self, stage=None):
        """Wrap each split in a ``DrowsyDataset``; ``stage`` is ignored."""
        self.train_dataset = DrowsyDataset(self.train_sequences)
        self.val_dataset = DrowsyDataset(self.val_sequences)
        self.test_dataset = DrowsyDataset(self.test_sequences)

    def _build_loader(self, dataset, shuffle):
        """Create a DataLoader with the settings shared by all three splits."""
        return DataLoader(
            dataset,
            batch_size=self.batch_size,
            shuffle=shuffle,
            num_workers=self.num_workers
        )

    def train_dataloader(self):
        """Shuffled loader over the training split."""
        return self._build_loader(self.train_dataset, shuffle=True)

    def val_dataloader(self):
        """Ordered loader over the validation split."""
        return self._build_loader(self.val_dataset, shuffle=False)

    def test_dataloader(self):
        """Ordered loader over the test split."""
        return self._build_loader(self.test_dataset, shuffle=False)

class DrowsyModel(nn.Module):
    """Stacked LSTM followed by a linear classification head.

    Args:
        n_features: size of the feature vector at each time step.
        n_classes: number of output logits.
        n_hidden: LSTM hidden size.
        n_layers: number of stacked LSTM layers.
        dropout: dropout probability applied between LSTM layers. It is
            ignored when ``n_layers == 1``, because ``nn.LSTM`` has no
            between-layer position to apply it and would only emit a warning.
    """

    def __init__(self, n_features, n_classes, n_hidden=256, n_layers=3, dropout=0.75):
        super().__init__()

        self.n_hidden = n_hidden

        self.lstm = nn.LSTM(
            input_size=n_features,
            hidden_size=n_hidden,
            num_layers=n_layers,
            batch_first=True,
            dropout=dropout if n_layers > 1 else 0.0
        )

        self.classifier = nn.Linear(n_hidden, n_classes)

    def forward(self, x):
        """Classify a batch of sequences.

        Args:
            x: tensor laid out batch-first, i.e. ``(batch, seq_len, n_features)``.

        Returns:
            Logits of shape ``(batch, n_classes)``.
        """
        self.lstm.flatten_parameters()
        _, (hidden, _) = self.lstm(x)

        # hidden is (num_layers, batch, n_hidden); keep the top layer's final state.
        out = hidden[-1]
        return self.classifier(out)
    
class DrowsyPredictor(pl.LightningModule):
    """LightningModule wrapping ``DrowsyModel`` with a cross-entropy objective.

    Args:
        n_features: number of input features per time step.
        n_classes: number of target classes.
        lr: Adam learning rate. It is stored as ``self.lr`` so that it can be
            tuned or overridden without editing ``configure_optimizers``.
    """

    def __init__(self, n_features: int, n_classes: int, lr: float = 0.0001):
        super().__init__()
        self.model = DrowsyModel(n_features, n_classes)
        self.criterion = nn.CrossEntropyLoss()
        self.lr = lr

    def forward(self, x, label=None):
        """Run the model and, when ``label`` is given, compute the loss.

        Returns:
            ``(loss, output)`` where ``loss`` is 0 if no label was supplied
            and ``output`` holds the raw class logits.
        """
        output = self.model(x)
        loss = 0
        if label is not None:
            loss = self.criterion(output, label)
        return loss, output

    def _shared_step(self, batch, stage):
        """Compute and log loss/accuracy for one batch.

        ``stage`` is the metric prefix (``train``, ``val`` or ``test``), which
        yields the logged names ``<stage>_loss`` and ``<stage>_accuracy``.
        """
        sequences = batch["sequence"]
        labels = batch["label"]
        loss, outputs = self(sequences, labels)
        predictions = torch.argmax(outputs, dim=1)
        step_accuracy = accuracy(predictions, labels)

        self.log(f"{stage}_loss", loss, prog_bar=True, logger=True)
        self.log(f"{stage}_accuracy", step_accuracy, prog_bar=True, logger=True)

        return {"loss": loss, "accuracy": step_accuracy}

    def training_step(self, batch, batch_idx):
        """Training batch: logs ``train_loss`` / ``train_accuracy``."""
        return self._shared_step(batch, "train")

    def validation_step(self, batch, batch_idx):
        """Validation batch: logs ``val_loss`` / ``val_accuracy``."""
        return self._shared_step(batch, "val")

    def test_step(self, batch, batch_idx):
        """Test batch: logs ``test_loss`` / ``test_accuracy``."""
        return self._shared_step(batch, "test")

    def configure_optimizers(self):
        """Adam over all parameters with the configured learning rate."""
        return optim.Adam(self.parameters(), lr=self.lr)

Global seed set to 42


## Parameter Settings (參數設置)

In [3]:
# Load the TensorBoard notebook extension (reloading it if it is already
# loaded) and start TensorBoard on the Lightning log directory.
# NOTE(review): --host 0.0.0.0 listens on all network interfaces — confirm
# that exposing the dashboard beyond localhost is intended.
%load_ext tensorboard
%reload_ext tensorboard
%tensorboard --logdir ./lightning_logs --host 0.0.0.0 --port=8888

In [4]:
# Load the full dataset from CSV (path is relative to the notebook's working directory).
X_train = pd.read_csv('../data2.csv')

In [5]:
# Training hyperparameters.
N_EPOCHS = 200
BATCH_SIZE = 50

# Candidate feature columns of X_train.
# NOTE(review): these look like EEG/EOG channel names — confirm.
ORG_FEATURE_COLUMNS = ['TP8', 'FP2', 'FCZ', 'FT10', 'O2', 'O1', 'FT7', 'F4', 'TP7', 'C3', 'C4', 'F3', 'FT8', 'T6', 'HEOR', 'T5', 'VEOL', 'F7', 'FZ', 'VEOU', 'A1', 'P3', 'PZ', 'CP3', 'P4', 'CPZ', 'A2', 'HEOL', 'CP4', 'FT9', 'F8', 'OZ', 'CZ', 'FC4', 'FC3', 'FP1', 'PO1', 'T3', 'T4', 'PO2']
# Group the rows of X_train by their `group` column.
g = X_train.groupby("group")


## Main

In [None]:
# Round n trains on ORG_FEATURE_COLUMNS[n:], i.e. each round drops one more
# leading column than the previous one.
FIRST_ROUND = 34
LAST_ROUND = 35  # exclusive

# Fixed seed for the train/val/test split so that re-running the cell (for
# example to resume from a checkpoint) reproduces the same partition.
# NOTE(review): checkpoints written before this seed was introduced were
# trained on a different split, so test scores after resuming from them may
# include previously seen sequences — retrain from scratch for clean numbers.
SPLIT_SEED = 42

# Rounds that continue from an earlier run instead of starting from scratch.
RESUME_CHECKPOINTS = {
    34: "/Workspace/code/checkpoints/best-checkpoint-corr-34.ckpt",
}

# The label encoding does not depend on the round, so compute it once.
label_encoder = LabelEncoder()
encoded_labels = label_encoder.fit_transform(X_train.state)
X_train['label'] = encoded_labels

# Group only after `label` exists, so every group is guaranteed to carry it.
groups = X_train.groupby("group")

for n in range(FIRST_ROUND, LAST_ROUND):
    FEATURE_COLUMNS = ORG_FEATURE_COLUMNS[n:]

    print("------------------ Round: " + str(n) + " ------------------")
    print(FEATURE_COLUMNS)
    print("Len:", len(FEATURE_COLUMNS))

    # Prepare data ###########################################
    # One (features, label) pair per group; the label is read from the
    # group's first row.
    sequences = [
        (group[FEATURE_COLUMNS], group.label.iloc[0])
        for _, group in groups
    ]

    # Setting up train, test, val group #######################
    # 80% train, then the remaining 20% is halved into validation and test.
    train_sequences, holdout_sequences = train_test_split(
        sequences, test_size=0.2, random_state=SPLIT_SEED
    )
    val_sequences, test_sequences = train_test_split(
        holdout_sequences, test_size=0.5, random_state=SPLIT_SEED
    )

    # Setting up data module ##################################
    data_module = DrowsyDataModule(
        train_sequences, val_sequences, test_sequences, BATCH_SIZE
    )

    model = DrowsyPredictor(
        n_features=len(FEATURE_COLUMNS),
        n_classes=len(label_encoder.classes_)
    )

    # Check points and logger #################################
    checkpoint_callback = ModelCheckpoint(
        dirpath="checkpoints",
        filename="best-checkpoint-corr-" + str(n),
        save_top_k=2,
        verbose=True,
        monitor="val_loss",
        mode="min"
    )

    logger = TensorBoardLogger("lightning_logs", name="Drowsy_" + str(n))

    trainer = pl.Trainer(
        logger=logger,
        callbacks=[checkpoint_callback],
        max_epochs=N_EPOCHS,
        gpus=[0],
        # NOTE(review): no trainer.tune() call is made in this cell, so this
        # flag presumably has no effect — confirm against the installed
        # Lightning version.
        auto_lr_find=True,
    )

    # Training start: ckpt_path=None trains from scratch, otherwise training
    # resumes from the listed checkpoint.
    trainer.fit(model, data_module, ckpt_path=RESUME_CHECKPOINTS.get(n))
    trainer.test(model, data_module)

------------------ Round: 33 ------------------
['FC4', 'FC3', 'FP1', 'PO1', 'T3', 'T4', 'PO2']
Len: 7


GPU available: True, used: True
TPU available: False, using: 0 TPU cores
IPU available: False, using: 0 IPUs
Restoring states from the checkpoint path at /Workspace/code/checkpoints/best-checkpoint-corr-33-v1.ckpt
LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1,2]
  "You're resuming from a checkpoint that ended mid-epoch."
Restored all states from the checkpoint file at /Workspace/code/checkpoints/best-checkpoint-corr-33-v1.ckpt

  | Name      | Type             | Params
-----------------------------------------------
0 | model     | DrowsyModel      | 1.3 M 
1 | criterion | CrossEntropyLoss | 0     
-----------------------------------------------
1.3 M     Trainable params
0         Non-trainable params
1.3 M     Total params
5.298     Total estimated model params size (MB)
  rank_zero_warn(f"Checkpoint directory {dirpath} exists and is not empty.")


                                                                      

Global seed set to 42


Epoch 97:  89%|████████▊ | 226/255 [02:36<00:20,  1.44it/s, loss=0.0974, v_num=2, train_loss=0.127, train_accuracy=0.944] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 97:  89%|████████▉ | 228/255 [02:38<00:18,  1.44it/s, loss=0.0974, v_num=2, train_loss=0.127, train_accuracy=0.944]
Validating:   7%|▋         | 2/29 [00:01<00:20,  1.32it/s][A
Epoch 97:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.0974, v_num=2, train_loss=0.127, train_accuracy=0.944]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.68it/s][A
Epoch 97:  91%|█████████ | 232/255 [02:39<00:15,  1.46it/s, loss=0.0974, v_num=2, train_loss=0.127, train_accuracy=0.944]
Validating:  21%|██        | 6/29 [00:02<00:05,  3.91it/s][A
Epoch 97:  92%|█████████▏| 234/255 [02:39<00:14,  1.47it/s, loss=0.0974, v_num=2, train_loss=0.127, train_accuracy=0.944]
Validating:  28%|██▊       | 8/29 [00:02<00:04,  4.76it/s][A
Epoch 97:  93%|█████████▎| 236/255 [02:39<00:12,  1.4

Epoch 97, global step 22147: val_loss was not in top 2


Epoch 98:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0839, v_num=2, train_loss=0.376, train_accuracy=0.889, val_loss=0.173, val_accuracy=0.931]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 98:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0839, v_num=2, train_loss=0.376, train_accuracy=0.889, val_loss=0.173, val_accuracy=0.931]
Validating:   7%|▋         | 2/29 [00:01<00:20,  1.29it/s][A
Epoch 98:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0839, v_num=2, train_loss=0.376, train_accuracy=0.889, val_loss=0.173, val_accuracy=0.931]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.69it/s][A
Epoch 98:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0839, v_num=2, train_loss=0.376, train_accuracy=0.889, val_loss=0.173, val_accuracy=0.931]
Validating:  21%|██        | 6/29 [00:02<00:05,  3.87it/s][A
Epoch 98:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0839, v_num=2, train_loss

Epoch 98, global step 22373: val_loss reached 0.15569 (best 0.15569), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-33-v1.ckpt" as top 2


Epoch 99:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0699, v_num=2, train_loss=0.0365, train_accuracy=1.000, val_loss=0.156, val_accuracy=0.947] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 99:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0699, v_num=2, train_loss=0.0365, train_accuracy=1.000, val_loss=0.156, val_accuracy=0.947]
Validating:   7%|▋         | 2/29 [00:01<00:21,  1.26it/s][A
Epoch 99:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0699, v_num=2, train_loss=0.0365, train_accuracy=1.000, val_loss=0.156, val_accuracy=0.947]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.66it/s][A
Epoch 99:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0699, v_num=2, train_loss=0.0365, train_accuracy=1.000, val_loss=0.156, val_accuracy=0.947]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.83it/s][A
Epoch 99:  92%|█████████▏| 234/255 [02:37<00:14,  1.49it/s, loss=0.0699, v_num=2, train_l

Epoch 99, global step 22599: val_loss was not in top 2


Epoch 100:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0654, v_num=2, train_loss=0.0638, train_accuracy=0.944, val_loss=0.169, val_accuracy=0.943] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 100:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0654, v_num=2, train_loss=0.0638, train_accuracy=0.944, val_loss=0.169, val_accuracy=0.943]
Validating:   7%|▋         | 2/29 [00:01<00:21,  1.23it/s][A
Epoch 100:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0654, v_num=2, train_loss=0.0638, train_accuracy=0.944, val_loss=0.169, val_accuracy=0.943]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.60it/s][A
Epoch 100:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0654, v_num=2, train_loss=0.0638, train_accuracy=0.944, val_loss=0.169, val_accuracy=0.943]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.80it/s][A
Epoch 100:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0654, v_num=2, tr

Epoch 100, global step 22825: val_loss was not in top 2


Epoch 101:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.0967, v_num=2, train_loss=0.258, train_accuracy=0.944, val_loss=0.171, val_accuracy=0.937]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 101:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.0967, v_num=2, train_loss=0.258, train_accuracy=0.944, val_loss=0.171, val_accuracy=0.937]
Validating:   7%|▋         | 2/29 [00:01<00:21,  1.23it/s][A
Epoch 101:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0967, v_num=2, train_loss=0.258, train_accuracy=0.944, val_loss=0.171, val_accuracy=0.937]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.55it/s][A
Epoch 101:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0967, v_num=2, train_loss=0.258, train_accuracy=0.944, val_loss=0.171, val_accuracy=0.937]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.78it/s][A
Epoch 101:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0967, v_num=2, train

Epoch 101, global step 23051: val_loss was not in top 2


Epoch 102:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.088, v_num=2, train_loss=0.170, train_accuracy=0.944, val_loss=0.210, val_accuracy=0.925]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 102:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.088, v_num=2, train_loss=0.170, train_accuracy=0.944, val_loss=0.210, val_accuracy=0.925]
Validating:   7%|▋         | 2/29 [00:01<00:21,  1.24it/s][A
Epoch 102:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.088, v_num=2, train_loss=0.170, train_accuracy=0.944, val_loss=0.210, val_accuracy=0.925]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.60it/s][A
Epoch 102:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.088, v_num=2, train_loss=0.170, train_accuracy=0.944, val_loss=0.210, val_accuracy=0.925]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.78it/s][A
Epoch 102:  92%|█████████▏| 234/255 [02:37<00:14,  1.49it/s, loss=0.088, v_num=2, train_loss

Epoch 102, global step 23277: val_loss was not in top 2


Epoch 103:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.101, v_num=2, train_loss=0.0536, train_accuracy=1.000, val_loss=0.181, val_accuracy=0.934] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 103:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.101, v_num=2, train_loss=0.0536, train_accuracy=1.000, val_loss=0.181, val_accuracy=0.934]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.22it/s][A
Epoch 103:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.101, v_num=2, train_loss=0.0536, train_accuracy=1.000, val_loss=0.181, val_accuracy=0.934]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.57it/s][A
Epoch 103:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.101, v_num=2, train_loss=0.0536, train_accuracy=1.000, val_loss=0.181, val_accuracy=0.934]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.64it/s][A
Epoch 103:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.101, v_num=2, train_l

Epoch 103, global step 23503: val_loss was not in top 2


Epoch 104:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.236, v_num=2, train_loss=0.204, train_accuracy=0.889, val_loss=0.164, val_accuracy=0.944]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 104:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.236, v_num=2, train_loss=0.204, train_accuracy=0.889, val_loss=0.164, val_accuracy=0.944]
Validating:   7%|▋         | 2/29 [00:02<00:23,  1.14it/s][A
Epoch 104:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.236, v_num=2, train_loss=0.204, train_accuracy=0.889, val_loss=0.164, val_accuracy=0.944]
Validating:  14%|█▍        | 4/29 [00:02<00:10,  2.42it/s][A
Epoch 104:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.236, v_num=2, train_loss=0.204, train_accuracy=0.889, val_loss=0.164, val_accuracy=0.944]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.64it/s][A
Epoch 104:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.236, v_num=2, train_loss

Epoch 104, global step 23729: val_loss was not in top 2


Epoch 105:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.0779, v_num=2, train_loss=0.0484, train_accuracy=1.000, val_loss=0.269, val_accuracy=0.903]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 105:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.0779, v_num=2, train_loss=0.0484, train_accuracy=1.000, val_loss=0.269, val_accuracy=0.903]
Validating:   7%|▋         | 2/29 [00:01<00:21,  1.23it/s][A
Epoch 105:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0779, v_num=2, train_loss=0.0484, train_accuracy=1.000, val_loss=0.269, val_accuracy=0.903]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.54it/s][A
Epoch 105:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0779, v_num=2, train_loss=0.0484, train_accuracy=1.000, val_loss=0.269, val_accuracy=0.903]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.76it/s][A
Epoch 105:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0779, v_num=2, tra

Epoch 105, global step 23955: val_loss reached 0.15047 (best 0.15047), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-33.ckpt" as top 2


Epoch 106:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.0517, v_num=2, train_loss=0.124, train_accuracy=0.944, val_loss=0.150, val_accuracy=0.942]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 106:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.0517, v_num=2, train_loss=0.124, train_accuracy=0.944, val_loss=0.150, val_accuracy=0.942]
Validating:   7%|▋         | 2/29 [00:01<00:21,  1.23it/s][A
Epoch 106:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0517, v_num=2, train_loss=0.124, train_accuracy=0.944, val_loss=0.150, val_accuracy=0.942]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.61it/s][A
Epoch 106:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0517, v_num=2, train_loss=0.124, train_accuracy=0.944, val_loss=0.150, val_accuracy=0.942]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.82it/s][A
Epoch 106:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0517, v_num=2, train

Epoch 106, global step 24181: val_loss was not in top 2


Epoch 107:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0708, v_num=2, train_loss=0.174, train_accuracy=0.944, val_loss=0.169, val_accuracy=0.944]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 107:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0708, v_num=2, train_loss=0.174, train_accuracy=0.944, val_loss=0.169, val_accuracy=0.944]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.22it/s][A
Epoch 107:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0708, v_num=2, train_loss=0.174, train_accuracy=0.944, val_loss=0.169, val_accuracy=0.944]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.60it/s][A
Epoch 107:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0708, v_num=2, train_loss=0.174, train_accuracy=0.944, val_loss=0.169, val_accuracy=0.944]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.83it/s][A
Epoch 107:  92%|█████████▏| 234/255 [02:37<00:14,  1.49it/s, loss=0.0708, v_num=2, train

Epoch 107, global step 24407: val_loss was not in top 2


Epoch 108:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0673, v_num=2, train_loss=0.102, train_accuracy=0.944, val_loss=0.177, val_accuracy=0.945]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 108:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0673, v_num=2, train_loss=0.102, train_accuracy=0.944, val_loss=0.177, val_accuracy=0.945]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.21it/s][A
Epoch 108:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0673, v_num=2, train_loss=0.102, train_accuracy=0.944, val_loss=0.177, val_accuracy=0.945]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.56it/s][A
Epoch 108:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0673, v_num=2, train_loss=0.102, train_accuracy=0.944, val_loss=0.177, val_accuracy=0.945]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.78it/s][A
Epoch 108:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0673, v_num=2, train

Epoch 108, global step 24633: val_loss was not in top 2


Epoch 109:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0781, v_num=2, train_loss=0.0591, train_accuracy=0.944, val_loss=0.176, val_accuracy=0.940] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 109:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0781, v_num=2, train_loss=0.0591, train_accuracy=0.944, val_loss=0.176, val_accuracy=0.940]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.21it/s][A
Epoch 109:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0781, v_num=2, train_loss=0.0591, train_accuracy=0.944, val_loss=0.176, val_accuracy=0.940]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.58it/s][A
Epoch 109:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0781, v_num=2, train_loss=0.0591, train_accuracy=0.944, val_loss=0.176, val_accuracy=0.940]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.81it/s][A
Epoch 109:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0781, v_num=2, tr

Epoch 109, global step 24859: val_loss was not in top 2


Epoch 110:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.0717, v_num=2, train_loss=0.165, train_accuracy=0.944, val_loss=0.197, val_accuracy=0.938]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 110:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.0717, v_num=2, train_loss=0.165, train_accuracy=0.944, val_loss=0.197, val_accuracy=0.938]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.22it/s][A
Epoch 110:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0717, v_num=2, train_loss=0.165, train_accuracy=0.944, val_loss=0.197, val_accuracy=0.938]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.58it/s][A
Epoch 110:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0717, v_num=2, train_loss=0.165, train_accuracy=0.944, val_loss=0.197, val_accuracy=0.938]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.79it/s][A
Epoch 110:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0717, v_num=2, train

Epoch 110, global step 25085: val_loss was not in top 2


Epoch 111:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0605, v_num=2, train_loss=0.0065, train_accuracy=1.000, val_loss=0.245, val_accuracy=0.926] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 111:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0605, v_num=2, train_loss=0.0065, train_accuracy=1.000, val_loss=0.245, val_accuracy=0.926]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.23it/s][A
Epoch 111:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0605, v_num=2, train_loss=0.0065, train_accuracy=1.000, val_loss=0.245, val_accuracy=0.926]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.61it/s][A
Epoch 111:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0605, v_num=2, train_loss=0.0065, train_accuracy=1.000, val_loss=0.245, val_accuracy=0.926]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.82it/s][A
Epoch 111:  92%|█████████▏| 234/255 [02:37<00:14,  1.49it/s, loss=0.0605, v_num=2, tr

Epoch 111, global step 25311: val_loss was not in top 2


Epoch 112:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.108, v_num=2, train_loss=0.0229, train_accuracy=1.000, val_loss=0.171, val_accuracy=0.941]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 112:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.108, v_num=2, train_loss=0.0229, train_accuracy=1.000, val_loss=0.171, val_accuracy=0.941]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.22it/s][A
Epoch 112:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.108, v_num=2, train_loss=0.0229, train_accuracy=1.000, val_loss=0.171, val_accuracy=0.941]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.58it/s][A
Epoch 112:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.108, v_num=2, train_loss=0.0229, train_accuracy=1.000, val_loss=0.171, val_accuracy=0.941]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.73it/s][A
Epoch 112:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.108, v_num=2, train_

Epoch 112, global step 25537: val_loss was not in top 2


Epoch 113:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.085, v_num=2, train_loss=0.0082, train_accuracy=1.000, val_loss=0.185, val_accuracy=0.937]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 113:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.085, v_num=2, train_loss=0.0082, train_accuracy=1.000, val_loss=0.185, val_accuracy=0.937]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.23it/s][A
Epoch 113:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.085, v_num=2, train_loss=0.0082, train_accuracy=1.000, val_loss=0.185, val_accuracy=0.937]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.57it/s][A
Epoch 113:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.085, v_num=2, train_loss=0.0082, train_accuracy=1.000, val_loss=0.185, val_accuracy=0.937]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.78it/s][A
Epoch 113:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.085, v_num=2, train_

Epoch 113, global step 25763: val_loss was not in top 2


Epoch 114:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.0549, v_num=2, train_loss=0.00985, train_accuracy=1.000, val_loss=0.193, val_accuracy=0.932]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 114:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.0549, v_num=2, train_loss=0.00985, train_accuracy=1.000, val_loss=0.193, val_accuracy=0.932]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.21it/s][A
Epoch 114:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0549, v_num=2, train_loss=0.00985, train_accuracy=1.000, val_loss=0.193, val_accuracy=0.932]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.56it/s][A
Epoch 114:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0549, v_num=2, train_loss=0.00985, train_accuracy=1.000, val_loss=0.193, val_accuracy=0.932]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.79it/s][A
Epoch 114:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0549, v_num=2,

Epoch 114, global step 25989: val_loss was not in top 2


Epoch 115:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.229, v_num=2, train_loss=0.203, train_accuracy=0.944, val_loss=0.161, val_accuracy=0.945]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 115:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.229, v_num=2, train_loss=0.203, train_accuracy=0.944, val_loss=0.161, val_accuracy=0.945]
Validating:   7%|▋         | 2/29 [00:01<00:21,  1.23it/s][A
Epoch 115:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.229, v_num=2, train_loss=0.203, train_accuracy=0.944, val_loss=0.161, val_accuracy=0.945]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.61it/s][A
Epoch 115:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.229, v_num=2, train_loss=0.203, train_accuracy=0.944, val_loss=0.161, val_accuracy=0.945]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.82it/s][A
Epoch 115:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.229, v_num=2, train_los

Epoch 115, global step 26215: val_loss was not in top 2


Epoch 116:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.0879, v_num=2, train_loss=0.0303, train_accuracy=1.000, val_loss=0.293, val_accuracy=0.880]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 116:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.0879, v_num=2, train_loss=0.0303, train_accuracy=1.000, val_loss=0.293, val_accuracy=0.880]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.22it/s][A
Epoch 116:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0879, v_num=2, train_loss=0.0303, train_accuracy=1.000, val_loss=0.293, val_accuracy=0.880]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.59it/s][A
Epoch 116:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0879, v_num=2, train_loss=0.0303, train_accuracy=1.000, val_loss=0.293, val_accuracy=0.880]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.82it/s][A
Epoch 116:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0879, v_num=2, tra

Epoch 116, global step 26441: val_loss was not in top 2


Epoch 117:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0774, v_num=2, train_loss=0.212, train_accuracy=0.944, val_loss=0.169, val_accuracy=0.938] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 117:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0774, v_num=2, train_loss=0.212, train_accuracy=0.944, val_loss=0.169, val_accuracy=0.938]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.21it/s][A
Epoch 117:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0774, v_num=2, train_loss=0.212, train_accuracy=0.944, val_loss=0.169, val_accuracy=0.938]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.55it/s][A
Epoch 117:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0774, v_num=2, train_loss=0.212, train_accuracy=0.944, val_loss=0.169, val_accuracy=0.938]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.76it/s][A
Epoch 117:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0774, v_num=2, train_

Epoch 117, global step 26667: val_loss was not in top 2


Epoch 118:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.0901, v_num=2, train_loss=0.0302, train_accuracy=1.000, val_loss=0.172, val_accuracy=0.942] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 118:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.0901, v_num=2, train_loss=0.0302, train_accuracy=1.000, val_loss=0.172, val_accuracy=0.942]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.21it/s][A
Epoch 118:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0901, v_num=2, train_loss=0.0302, train_accuracy=1.000, val_loss=0.172, val_accuracy=0.942]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.57it/s][A
Epoch 118:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0901, v_num=2, train_loss=0.0302, train_accuracy=1.000, val_loss=0.172, val_accuracy=0.942]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.78it/s][A
Epoch 118:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0901, v_num=2, tr

Epoch 118, global step 26893: val_loss was not in top 2


Epoch 119:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0911, v_num=2, train_loss=0.0362, train_accuracy=1.000, val_loss=0.193, val_accuracy=0.931]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 119:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0911, v_num=2, train_loss=0.0362, train_accuracy=1.000, val_loss=0.193, val_accuracy=0.931]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.20it/s][A
Epoch 119:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0911, v_num=2, train_loss=0.0362, train_accuracy=1.000, val_loss=0.193, val_accuracy=0.931]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.58it/s][A
Epoch 119:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0911, v_num=2, train_loss=0.0362, train_accuracy=1.000, val_loss=0.193, val_accuracy=0.931]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.78it/s][A
Epoch 119:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0911, v_num=2, tra

Epoch 119, global step 27119: val_loss was not in top 2


Epoch 120:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.097, v_num=2, train_loss=0.269, train_accuracy=0.889, val_loss=0.195, val_accuracy=0.933]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 120:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.097, v_num=2, train_loss=0.269, train_accuracy=0.889, val_loss=0.195, val_accuracy=0.933]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.21it/s][A
Epoch 120:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.097, v_num=2, train_loss=0.269, train_accuracy=0.889, val_loss=0.195, val_accuracy=0.933]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.57it/s][A
Epoch 120:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.097, v_num=2, train_loss=0.269, train_accuracy=0.889, val_loss=0.195, val_accuracy=0.933]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.77it/s][A
Epoch 120:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.097, v_num=2, train_loss

Epoch 120, global step 27345: val_loss was not in top 2


Epoch 121:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.102, v_num=2, train_loss=0.00923, train_accuracy=1.000, val_loss=0.169, val_accuracy=0.935]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 121:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.102, v_num=2, train_loss=0.00923, train_accuracy=1.000, val_loss=0.169, val_accuracy=0.935]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.21it/s][A
Epoch 121:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.102, v_num=2, train_loss=0.00923, train_accuracy=1.000, val_loss=0.169, val_accuracy=0.935]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.60it/s][A
Epoch 121:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.102, v_num=2, train_loss=0.00923, train_accuracy=1.000, val_loss=0.169, val_accuracy=0.935]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.82it/s][A
Epoch 121:  92%|█████████▏| 234/255 [02:37<00:14,  1.49it/s, loss=0.102, v_num=2, trai

Epoch 121, global step 27571: val_loss was not in top 2


Epoch 122:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.0937, v_num=2, train_loss=0.0953, train_accuracy=0.944, val_loss=0.160, val_accuracy=0.939]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 122:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.0937, v_num=2, train_loss=0.0953, train_accuracy=0.944, val_loss=0.160, val_accuracy=0.939]
Validating:   7%|▋         | 2/29 [00:01<00:21,  1.23it/s][A
Epoch 122:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0937, v_num=2, train_loss=0.0953, train_accuracy=0.944, val_loss=0.160, val_accuracy=0.939]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.57it/s][A
Epoch 122:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0937, v_num=2, train_loss=0.0953, train_accuracy=0.944, val_loss=0.160, val_accuracy=0.939]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.81it/s][A
Epoch 122:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0937, v_num=2, tra

Epoch 122, global step 27797: val_loss was not in top 2


Epoch 123:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0697, v_num=2, train_loss=0.0773, train_accuracy=0.944, val_loss=0.236, val_accuracy=0.922]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 123:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0697, v_num=2, train_loss=0.0773, train_accuracy=0.944, val_loss=0.236, val_accuracy=0.922]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.20it/s][A
Epoch 123:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0697, v_num=2, train_loss=0.0773, train_accuracy=0.944, val_loss=0.236, val_accuracy=0.922]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.56it/s][A
Epoch 123:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0697, v_num=2, train_loss=0.0773, train_accuracy=0.944, val_loss=0.236, val_accuracy=0.922]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.79it/s][A
Epoch 123:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0697, v_num=2, tra

Epoch 123, global step 28023: val_loss was not in top 2


Epoch 124:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0641, v_num=2, train_loss=0.0565, train_accuracy=1.000, val_loss=0.161, val_accuracy=0.940] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 124:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0641, v_num=2, train_loss=0.0565, train_accuracy=1.000, val_loss=0.161, val_accuracy=0.940]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.21it/s][A
Epoch 124:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0641, v_num=2, train_loss=0.0565, train_accuracy=1.000, val_loss=0.161, val_accuracy=0.940]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.55it/s][A
Epoch 124:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0641, v_num=2, train_loss=0.0565, train_accuracy=1.000, val_loss=0.161, val_accuracy=0.940]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.79it/s][A
Epoch 124:  92%|█████████▏| 234/255 [02:37<00:14,  1.49it/s, loss=0.0641, v_num=2, tr

Epoch 124, global step 28249: val_loss reached 0.14899 (best 0.14899), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-33-v1.ckpt" as top 2


Epoch 125:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0491, v_num=2, train_loss=0.0208, train_accuracy=1.000, val_loss=0.149, val_accuracy=0.947] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 125:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0491, v_num=2, train_loss=0.0208, train_accuracy=1.000, val_loss=0.149, val_accuracy=0.947]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.22it/s][A
Epoch 125:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0491, v_num=2, train_loss=0.0208, train_accuracy=1.000, val_loss=0.149, val_accuracy=0.947]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.60it/s][A
Epoch 125:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0491, v_num=2, train_loss=0.0208, train_accuracy=1.000, val_loss=0.149, val_accuracy=0.947]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.82it/s][A
Epoch 125:  92%|█████████▏| 234/255 [02:37<00:14,  1.49it/s, loss=0.0491, v_num=2, tr

Epoch 125, global step 28475: val_loss reached 0.15007 (best 0.14899), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-33.ckpt" as top 2


Epoch 126:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.089, v_num=2, train_loss=0.0243, train_accuracy=1.000, val_loss=0.150, val_accuracy=0.952]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 126:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.089, v_num=2, train_loss=0.0243, train_accuracy=1.000, val_loss=0.150, val_accuracy=0.952]
Validating:   7%|▋         | 2/29 [00:01<00:21,  1.23it/s][A
Epoch 126:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.089, v_num=2, train_loss=0.0243, train_accuracy=1.000, val_loss=0.150, val_accuracy=0.952]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.57it/s][A
Epoch 126:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.089, v_num=2, train_loss=0.0243, train_accuracy=1.000, val_loss=0.150, val_accuracy=0.952]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.80it/s][A
Epoch 126:  92%|█████████▏| 234/255 [02:37<00:14,  1.49it/s, loss=0.089, v_num=2, train_

Epoch 126, global step 28701: val_loss was not in top 2


Epoch 127:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.064, v_num=2, train_loss=0.0272, train_accuracy=1.000, val_loss=0.161, val_accuracy=0.937]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 127:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.064, v_num=2, train_loss=0.0272, train_accuracy=1.000, val_loss=0.161, val_accuracy=0.937]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.22it/s][A
Epoch 127:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.064, v_num=2, train_loss=0.0272, train_accuracy=1.000, val_loss=0.161, val_accuracy=0.937]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.57it/s][A
Epoch 127:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.064, v_num=2, train_loss=0.0272, train_accuracy=1.000, val_loss=0.161, val_accuracy=0.937]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.78it/s][A
Epoch 127:  92%|█████████▏| 234/255 [02:37<00:14,  1.49it/s, loss=0.064, v_num=2, train_

Epoch 127, global step 28927: val_loss was not in top 2


Epoch 128:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.0854, v_num=2, train_loss=0.00647, train_accuracy=1.000, val_loss=0.177, val_accuracy=0.944]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 128:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.0854, v_num=2, train_loss=0.00647, train_accuracy=1.000, val_loss=0.177, val_accuracy=0.944]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.22it/s][A
Epoch 128:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0854, v_num=2, train_loss=0.00647, train_accuracy=1.000, val_loss=0.177, val_accuracy=0.944]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.59it/s][A
Epoch 128:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0854, v_num=2, train_loss=0.00647, train_accuracy=1.000, val_loss=0.177, val_accuracy=0.944]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.80it/s][A
Epoch 128:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0854, v_num=2,

Epoch 128, global step 29153: val_loss was not in top 2


Epoch 129:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.206, v_num=2, train_loss=0.139, train_accuracy=1.000, val_loss=0.165, val_accuracy=0.948]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 129:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.206, v_num=2, train_loss=0.139, train_accuracy=1.000, val_loss=0.165, val_accuracy=0.948]
Validating:   7%|▋         | 2/29 [00:01<00:21,  1.23it/s][A
Epoch 129:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.206, v_num=2, train_loss=0.139, train_accuracy=1.000, val_loss=0.165, val_accuracy=0.948]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.59it/s][A
Epoch 129:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.206, v_num=2, train_loss=0.139, train_accuracy=1.000, val_loss=0.165, val_accuracy=0.948]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.80it/s][A
Epoch 129:  92%|█████████▏| 234/255 [02:37<00:14,  1.49it/s, loss=0.206, v_num=2, train_los

Epoch 129, global step 29379: val_loss was not in top 2


Epoch 130:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0677, v_num=2, train_loss=0.0473, train_accuracy=1.000, val_loss=0.221, val_accuracy=0.911]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 130:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.0677, v_num=2, train_loss=0.0473, train_accuracy=1.000, val_loss=0.221, val_accuracy=0.911]
Validating:   7%|▋         | 2/29 [00:02<00:23,  1.15it/s][A
Epoch 130:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0677, v_num=2, train_loss=0.0473, train_accuracy=1.000, val_loss=0.221, val_accuracy=0.911]
Validating:  14%|█▍        | 4/29 [00:02<00:10,  2.48it/s][A
Epoch 130:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0677, v_num=2, train_loss=0.0473, train_accuracy=1.000, val_loss=0.221, val_accuracy=0.911]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.73it/s][A
Epoch 130:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0677, v_num=2, tra

Epoch 130, global step 29605: val_loss reached 0.13870 (best 0.13870), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-33.ckpt" as top 2


Epoch 131:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0933, v_num=2, train_loss=0.134, train_accuracy=0.944, val_loss=0.139, val_accuracy=0.946]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 131:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0933, v_num=2, train_loss=0.134, train_accuracy=0.944, val_loss=0.139, val_accuracy=0.946]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.22it/s][A
Epoch 131:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0933, v_num=2, train_loss=0.134, train_accuracy=0.944, val_loss=0.139, val_accuracy=0.946]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.58it/s][A
Epoch 131:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0933, v_num=2, train_loss=0.134, train_accuracy=0.944, val_loss=0.139, val_accuracy=0.946]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.79it/s][A
Epoch 131:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0933, v_num=2, train

Epoch 131, global step 29831: val_loss was not in top 2


Epoch 132:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0559, v_num=2, train_loss=0.135, train_accuracy=0.944, val_loss=0.162, val_accuracy=0.945]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 132:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0559, v_num=2, train_loss=0.135, train_accuracy=0.944, val_loss=0.162, val_accuracy=0.945]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.22it/s][A
Epoch 132:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0559, v_num=2, train_loss=0.135, train_accuracy=0.944, val_loss=0.162, val_accuracy=0.945]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.55it/s][A
Epoch 132:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0559, v_num=2, train_loss=0.135, train_accuracy=0.944, val_loss=0.162, val_accuracy=0.945]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.78it/s][A
Epoch 132:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0559, v_num=2, train

Epoch 132, global step 30057: val_loss reached 0.14788 (best 0.13870), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-33-v1.ckpt" as top 2


Epoch 133:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0543, v_num=2, train_loss=0.224, train_accuracy=0.944, val_loss=0.148, val_accuracy=0.949]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 133:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0543, v_num=2, train_loss=0.224, train_accuracy=0.944, val_loss=0.148, val_accuracy=0.949]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.21it/s][A
Epoch 133:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0543, v_num=2, train_loss=0.224, train_accuracy=0.944, val_loss=0.148, val_accuracy=0.949]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.56it/s][A
Epoch 133:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0543, v_num=2, train_loss=0.224, train_accuracy=0.944, val_loss=0.148, val_accuracy=0.949]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.82it/s][A
Epoch 133:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0543, v_num=2, train

Epoch 133, global step 30283: val_loss was not in top 2


Epoch 134:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.0644, v_num=2, train_loss=0.00931, train_accuracy=1.000, val_loss=0.191, val_accuracy=0.947]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 134:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.0644, v_num=2, train_loss=0.00931, train_accuracy=1.000, val_loss=0.191, val_accuracy=0.947]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.22it/s][A
Epoch 134:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0644, v_num=2, train_loss=0.00931, train_accuracy=1.000, val_loss=0.191, val_accuracy=0.947]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.60it/s][A
Epoch 134:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0644, v_num=2, train_loss=0.00931, train_accuracy=1.000, val_loss=0.191, val_accuracy=0.947]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.80it/s][A
Epoch 134:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0644, v_num=2,

Epoch 134, global step 30509: val_loss was not in top 2


Epoch 135:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0628, v_num=2, train_loss=0.059, train_accuracy=0.944, val_loss=0.204, val_accuracy=0.939]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 135:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0628, v_num=2, train_loss=0.059, train_accuracy=0.944, val_loss=0.204, val_accuracy=0.939]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.20it/s][A
Epoch 135:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0628, v_num=2, train_loss=0.059, train_accuracy=0.944, val_loss=0.204, val_accuracy=0.939]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.57it/s][A
Epoch 135:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0628, v_num=2, train_loss=0.059, train_accuracy=0.944, val_loss=0.204, val_accuracy=0.939]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.73it/s][A
Epoch 135:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0628, v_num=2, train

Epoch 135, global step 30735: val_loss was not in top 2


Epoch 136:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0455, v_num=2, train_loss=0.00513, train_accuracy=1.000, val_loss=0.221, val_accuracy=0.943]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 136:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0455, v_num=2, train_loss=0.00513, train_accuracy=1.000, val_loss=0.221, val_accuracy=0.943]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.21it/s][A
Epoch 136:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0455, v_num=2, train_loss=0.00513, train_accuracy=1.000, val_loss=0.221, val_accuracy=0.943]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.58it/s][A
Epoch 136:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0455, v_num=2, train_loss=0.00513, train_accuracy=1.000, val_loss=0.221, val_accuracy=0.943]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.79it/s][A
Epoch 136:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0455, v_num=2,

Epoch 136, global step 30961: val_loss was not in top 2


Epoch 137:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0321, v_num=2, train_loss=0.00762, train_accuracy=1.000, val_loss=0.152, val_accuracy=0.948]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 137:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0321, v_num=2, train_loss=0.00762, train_accuracy=1.000, val_loss=0.152, val_accuracy=0.948]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.19it/s][A
Epoch 137:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0321, v_num=2, train_loss=0.00762, train_accuracy=1.000, val_loss=0.152, val_accuracy=0.948]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.56it/s][A
Epoch 137:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0321, v_num=2, train_loss=0.00762, train_accuracy=1.000, val_loss=0.152, val_accuracy=0.948]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.74it/s][A
Epoch 137:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0321, v_num=2,

Epoch 137, global step 31187: val_loss was not in top 2


Epoch 138:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0576, v_num=2, train_loss=0.00388, train_accuracy=1.000, val_loss=0.150, val_accuracy=0.950]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 138:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0576, v_num=2, train_loss=0.00388, train_accuracy=1.000, val_loss=0.150, val_accuracy=0.950]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.20it/s][A
Epoch 138:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0576, v_num=2, train_loss=0.00388, train_accuracy=1.000, val_loss=0.150, val_accuracy=0.950]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.58it/s][A
Epoch 138:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0576, v_num=2, train_loss=0.00388, train_accuracy=1.000, val_loss=0.150, val_accuracy=0.950]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.77it/s][A
Epoch 138:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0576, v_num=2,

Epoch 138, global step 31413: val_loss was not in top 2


Epoch 139:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0574, v_num=2, train_loss=0.0276, train_accuracy=1.000, val_loss=0.163, val_accuracy=0.948] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 139:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0574, v_num=2, train_loss=0.0276, train_accuracy=1.000, val_loss=0.163, val_accuracy=0.948]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.21it/s][A
Epoch 139:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0574, v_num=2, train_loss=0.0276, train_accuracy=1.000, val_loss=0.163, val_accuracy=0.948]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.58it/s][A
Epoch 139:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0574, v_num=2, train_loss=0.0276, train_accuracy=1.000, val_loss=0.163, val_accuracy=0.948]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.80it/s][A
Epoch 139:  92%|█████████▏| 234/255 [02:37<00:14,  1.49it/s, loss=0.0574, v_num=2, tr

Epoch 139, global step 31639: val_loss was not in top 2


Epoch 140:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0815, v_num=2, train_loss=0.0299, train_accuracy=1.000, val_loss=0.157, val_accuracy=0.947] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 140:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0815, v_num=2, train_loss=0.0299, train_accuracy=1.000, val_loss=0.157, val_accuracy=0.947]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.20it/s][A
Epoch 140:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0815, v_num=2, train_loss=0.0299, train_accuracy=1.000, val_loss=0.157, val_accuracy=0.947]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.58it/s][A
Epoch 140:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0815, v_num=2, train_loss=0.0299, train_accuracy=1.000, val_loss=0.157, val_accuracy=0.947]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.80it/s][A
Epoch 140:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0815, v_num=2, tr

Epoch 140, global step 31865: val_loss was not in top 2


Epoch 141:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0573, v_num=2, train_loss=0.0775, train_accuracy=0.944, val_loss=0.185, val_accuracy=0.944] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 141:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0573, v_num=2, train_loss=0.0775, train_accuracy=0.944, val_loss=0.185, val_accuracy=0.944]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.20it/s][A
Epoch 141:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0573, v_num=2, train_loss=0.0775, train_accuracy=0.944, val_loss=0.185, val_accuracy=0.944]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.56it/s][A
Epoch 141:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0573, v_num=2, train_loss=0.0775, train_accuracy=0.944, val_loss=0.185, val_accuracy=0.944]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.80it/s][A
Epoch 141:  92%|█████████▏| 234/255 [02:37<00:14,  1.49it/s, loss=0.0573, v_num=2, tr

Epoch 141, global step 32091: val_loss reached 0.14571 (best 0.13870), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-33-v1.ckpt" as top 2


Epoch 142:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0456, v_num=2, train_loss=0.0476, train_accuracy=0.944, val_loss=0.146, val_accuracy=0.947] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 142:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0456, v_num=2, train_loss=0.0476, train_accuracy=0.944, val_loss=0.146, val_accuracy=0.947]
Validating:   7%|▋         | 2/29 [00:01<00:21,  1.23it/s][A
Epoch 142:  90%|█████████ | 230/255 [02:36<00:17,  1.46it/s, loss=0.0456, v_num=2, train_loss=0.0476, train_accuracy=0.944, val_loss=0.146, val_accuracy=0.947]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.60it/s][A
Epoch 142:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0456, v_num=2, train_loss=0.0476, train_accuracy=0.944, val_loss=0.146, val_accuracy=0.947]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.80it/s][A
Epoch 142:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0456, v_num=2, tr

Epoch 142, global step 32317: val_loss was not in top 2


Epoch 143:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.0405, v_num=2, train_loss=0.0112, train_accuracy=1.000, val_loss=0.155, val_accuracy=0.952] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 143:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.0405, v_num=2, train_loss=0.0112, train_accuracy=1.000, val_loss=0.155, val_accuracy=0.952]
Validating:   7%|▋         | 2/29 [00:02<00:23,  1.15it/s][A
Epoch 143:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0405, v_num=2, train_loss=0.0112, train_accuracy=1.000, val_loss=0.155, val_accuracy=0.952]
Validating:  14%|█▍        | 4/29 [00:02<00:10,  2.49it/s][A
Epoch 143:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0405, v_num=2, train_loss=0.0112, train_accuracy=1.000, val_loss=0.155, val_accuracy=0.952]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.73it/s][A
Epoch 143:  92%|█████████▏| 234/255 [02:38<00:14,  1.48it/s, loss=0.0405, v_num=2, tr

Epoch 143, global step 32543: val_loss was not in top 2


Epoch 144:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0728, v_num=2, train_loss=0.0426, train_accuracy=1.000, val_loss=0.224, val_accuracy=0.929] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 144:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0728, v_num=2, train_loss=0.0426, train_accuracy=1.000, val_loss=0.224, val_accuracy=0.929]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.22it/s][A
Epoch 144:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0728, v_num=2, train_loss=0.0426, train_accuracy=1.000, val_loss=0.224, val_accuracy=0.929]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.55it/s][A
Epoch 144:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0728, v_num=2, train_loss=0.0426, train_accuracy=1.000, val_loss=0.224, val_accuracy=0.929]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.78it/s][A
Epoch 144:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0728, v_num=2, tr

Epoch 144, global step 32769: val_loss was not in top 2


Epoch 145:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0559, v_num=2, train_loss=0.0189, train_accuracy=1.000, val_loss=0.178, val_accuracy=0.950] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 145:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0559, v_num=2, train_loss=0.0189, train_accuracy=1.000, val_loss=0.178, val_accuracy=0.950]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.22it/s][A
Epoch 145:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0559, v_num=2, train_loss=0.0189, train_accuracy=1.000, val_loss=0.178, val_accuracy=0.950]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.59it/s][A
Epoch 145:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0559, v_num=2, train_loss=0.0189, train_accuracy=1.000, val_loss=0.178, val_accuracy=0.950]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.80it/s][A
Epoch 145:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0559, v_num=2, tr

Epoch 145, global step 32995: val_loss was not in top 2


Epoch 146:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0549, v_num=2, train_loss=0.00207, train_accuracy=1.000, val_loss=0.165, val_accuracy=0.941]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 146:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0549, v_num=2, train_loss=0.00207, train_accuracy=1.000, val_loss=0.165, val_accuracy=0.941]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.21it/s][A
Epoch 146:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0549, v_num=2, train_loss=0.00207, train_accuracy=1.000, val_loss=0.165, val_accuracy=0.941]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.55it/s][A
Epoch 146:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0549, v_num=2, train_loss=0.00207, train_accuracy=1.000, val_loss=0.165, val_accuracy=0.941]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.78it/s][A
Epoch 146:  92%|█████████▏| 234/255 [02:37<00:14,  1.49it/s, loss=0.0549, v_num=2,

Epoch 146, global step 33221: val_loss was not in top 2


Epoch 147:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.0568, v_num=2, train_loss=0.084, train_accuracy=0.944, val_loss=0.287, val_accuracy=0.930]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 147:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.0568, v_num=2, train_loss=0.084, train_accuracy=0.944, val_loss=0.287, val_accuracy=0.930]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.21it/s][A
Epoch 147:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0568, v_num=2, train_loss=0.084, train_accuracy=0.944, val_loss=0.287, val_accuracy=0.930]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.58it/s][A
Epoch 147:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0568, v_num=2, train_loss=0.084, train_accuracy=0.944, val_loss=0.287, val_accuracy=0.930]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.79it/s][A
Epoch 147:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0568, v_num=2, train

Epoch 147, global step 33447: val_loss was not in top 2


Epoch 148:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0682, v_num=2, train_loss=0.441, train_accuracy=0.889, val_loss=0.147, val_accuracy=0.950]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 148:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0682, v_num=2, train_loss=0.441, train_accuracy=0.889, val_loss=0.147, val_accuracy=0.950]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.22it/s][A
Epoch 148:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0682, v_num=2, train_loss=0.441, train_accuracy=0.889, val_loss=0.147, val_accuracy=0.950]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.59it/s][A
Epoch 148:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0682, v_num=2, train_loss=0.441, train_accuracy=0.889, val_loss=0.147, val_accuracy=0.950]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.76it/s][A
Epoch 148:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0682, v_num=2, train

Epoch 148, global step 33673: val_loss was not in top 2


Epoch 149:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0375, v_num=2, train_loss=0.0587, train_accuracy=0.944, val_loss=0.154, val_accuracy=0.947]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 149:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0375, v_num=2, train_loss=0.0587, train_accuracy=0.944, val_loss=0.154, val_accuracy=0.947]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.21it/s][A
Epoch 149:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0375, v_num=2, train_loss=0.0587, train_accuracy=0.944, val_loss=0.154, val_accuracy=0.947]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.57it/s][A
Epoch 149:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0375, v_num=2, train_loss=0.0587, train_accuracy=0.944, val_loss=0.154, val_accuracy=0.947]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.80it/s][A
Epoch 149:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0375, v_num=2, t

Epoch 149, global step 33899: val_loss was not in top 2


Epoch 150:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0397, v_num=2, train_loss=0.0236, train_accuracy=1.000, val_loss=0.155, val_accuracy=0.953] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 150:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0397, v_num=2, train_loss=0.0236, train_accuracy=1.000, val_loss=0.155, val_accuracy=0.953]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.23it/s][A
Epoch 150:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0397, v_num=2, train_loss=0.0236, train_accuracy=1.000, val_loss=0.155, val_accuracy=0.953]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.59it/s][A
Epoch 150:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0397, v_num=2, train_loss=0.0236, train_accuracy=1.000, val_loss=0.155, val_accuracy=0.953]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.76it/s][A
Epoch 150:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0397, v_num=2, tr

Epoch 150, global step 34125: val_loss was not in top 2


Epoch 151:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.0482, v_num=2, train_loss=0.0541, train_accuracy=1.000, val_loss=0.159, val_accuracy=0.947] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 151:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.0482, v_num=2, train_loss=0.0541, train_accuracy=1.000, val_loss=0.159, val_accuracy=0.947]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.22it/s][A
Epoch 151:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0482, v_num=2, train_loss=0.0541, train_accuracy=1.000, val_loss=0.159, val_accuracy=0.947]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.56it/s][A
Epoch 151:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0482, v_num=2, train_loss=0.0541, train_accuracy=1.000, val_loss=0.159, val_accuracy=0.947]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.77it/s][A
Epoch 151:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0482, v_num=2, tr

Epoch 151, global step 34351: val_loss was not in top 2


Epoch 152:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0411, v_num=2, train_loss=0.141, train_accuracy=0.944, val_loss=0.160, val_accuracy=0.947]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 152:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0411, v_num=2, train_loss=0.141, train_accuracy=0.944, val_loss=0.160, val_accuracy=0.947]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.21it/s][A
Epoch 152:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0411, v_num=2, train_loss=0.141, train_accuracy=0.944, val_loss=0.160, val_accuracy=0.947]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.56it/s][A
Epoch 152:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0411, v_num=2, train_loss=0.141, train_accuracy=0.944, val_loss=0.160, val_accuracy=0.947]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.75it/s][A
Epoch 152:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0411, v_num=2, train

Epoch 152, global step 34577: val_loss was not in top 2


Epoch 153:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0711, v_num=2, train_loss=0.068, train_accuracy=1.000, val_loss=0.158, val_accuracy=0.950]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 153:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0711, v_num=2, train_loss=0.068, train_accuracy=1.000, val_loss=0.158, val_accuracy=0.950]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.21it/s][A
Epoch 153:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0711, v_num=2, train_loss=0.068, train_accuracy=1.000, val_loss=0.158, val_accuracy=0.950]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.58it/s][A
Epoch 153:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0711, v_num=2, train_loss=0.068, train_accuracy=1.000, val_loss=0.158, val_accuracy=0.950]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.81it/s][A
Epoch 153:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0711, v_num=2, train

Epoch 153, global step 34803: val_loss was not in top 2


Epoch 154:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0549, v_num=2, train_loss=0.156, train_accuracy=0.944, val_loss=0.152, val_accuracy=0.948]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 154:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0549, v_num=2, train_loss=0.156, train_accuracy=0.944, val_loss=0.152, val_accuracy=0.948]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.22it/s][A
Epoch 154:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0549, v_num=2, train_loss=0.156, train_accuracy=0.944, val_loss=0.152, val_accuracy=0.948]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.59it/s][A
Epoch 154:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0549, v_num=2, train_loss=0.156, train_accuracy=0.944, val_loss=0.152, val_accuracy=0.948]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.81it/s][A
Epoch 154:  92%|█████████▏| 234/255 [02:37<00:14,  1.49it/s, loss=0.0549, v_num=2, train

Epoch 154, global step 35029: val_loss was not in top 2


Epoch 155:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0363, v_num=2, train_loss=0.133, train_accuracy=0.889, val_loss=0.187, val_accuracy=0.945]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 155:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0363, v_num=2, train_loss=0.133, train_accuracy=0.889, val_loss=0.187, val_accuracy=0.945]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.21it/s][A
Epoch 155:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0363, v_num=2, train_loss=0.133, train_accuracy=0.889, val_loss=0.187, val_accuracy=0.945]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.59it/s][A
Epoch 155:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0363, v_num=2, train_loss=0.133, train_accuracy=0.889, val_loss=0.187, val_accuracy=0.945]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.76it/s][A
Epoch 155:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0363, v_num=2, train

Epoch 155, global step 35255: val_loss was not in top 2


Epoch 156:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0486, v_num=2, train_loss=0.0599, train_accuracy=1.000, val_loss=0.168, val_accuracy=0.950] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 156:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0486, v_num=2, train_loss=0.0599, train_accuracy=1.000, val_loss=0.168, val_accuracy=0.950]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.21it/s][A
Epoch 156:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0486, v_num=2, train_loss=0.0599, train_accuracy=1.000, val_loss=0.168, val_accuracy=0.950]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.59it/s][A
Epoch 156:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0486, v_num=2, train_loss=0.0599, train_accuracy=1.000, val_loss=0.168, val_accuracy=0.950]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.77it/s][A
Epoch 156:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0486, v_num=2, tr

Epoch 156, global step 35481: val_loss was not in top 2


Epoch 157:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0313, v_num=2, train_loss=0.00372, train_accuracy=1.000, val_loss=0.180, val_accuracy=0.945]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 157:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0313, v_num=2, train_loss=0.00372, train_accuracy=1.000, val_loss=0.180, val_accuracy=0.945]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.21it/s][A
Epoch 157:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0313, v_num=2, train_loss=0.00372, train_accuracy=1.000, val_loss=0.180, val_accuracy=0.945]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.59it/s][A
Epoch 157:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0313, v_num=2, train_loss=0.00372, train_accuracy=1.000, val_loss=0.180, val_accuracy=0.945]
Validating:  21%|██        | 6/29 [00:02<00:05,  3.83it/s][A
Epoch 157:  92%|█████████▏| 234/255 [02:37<00:14,  1.49it/s, loss=0.0313, v_num=2,

Epoch 157, global step 35707: val_loss was not in top 2


Epoch 158:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0369, v_num=2, train_loss=0.00206, train_accuracy=1.000, val_loss=0.180, val_accuracy=0.950]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 158:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0369, v_num=2, train_loss=0.00206, train_accuracy=1.000, val_loss=0.180, val_accuracy=0.950]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.21it/s][A
Epoch 158:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0369, v_num=2, train_loss=0.00206, train_accuracy=1.000, val_loss=0.180, val_accuracy=0.950]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.57it/s][A
Epoch 158:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0369, v_num=2, train_loss=0.00206, train_accuracy=1.000, val_loss=0.180, val_accuracy=0.950]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.78it/s][A
Epoch 158:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0369, v_num=2,

Epoch 158, global step 35933: val_loss was not in top 2


Epoch 159:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.0515, v_num=2, train_loss=0.0219, train_accuracy=1.000, val_loss=0.157, val_accuracy=0.952] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 159:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.0515, v_num=2, train_loss=0.0219, train_accuracy=1.000, val_loss=0.157, val_accuracy=0.952]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.22it/s][A
Epoch 159:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0515, v_num=2, train_loss=0.0219, train_accuracy=1.000, val_loss=0.157, val_accuracy=0.952]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.59it/s][A
Epoch 159:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0515, v_num=2, train_loss=0.0219, train_accuracy=1.000, val_loss=0.157, val_accuracy=0.952]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.81it/s][A
Epoch 159:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0515, v_num=2, tr

Epoch 159, global step 36159: val_loss reached 0.14338 (best 0.13870), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-33-v1.ckpt" as top 2


Epoch 160:  83%|████████▎ | 212/255 [02:25<00:29,  1.46it/s, loss=0.0316, v_num=2, train_loss=0.0139, train_accuracy=1.000, val_loss=0.143, val_accuracy=0.954] 

IOPub message rate exceeded.
The notebook server will temporarily stop sending output
to the client in order to avoid crashing it.
To change this limit, set the config variable
`--NotebookApp.iopub_msg_rate_limit`.

Current values:
NotebookApp.iopub_msg_rate_limit=1000.0 (msgs/sec)
NotebookApp.rate_limit_window=3.0 (secs)



Epoch 164:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0498, v_num=2, train_loss=0.00812, train_accuracy=1.000, val_loss=0.157, val_accuracy=0.954]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 164:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0498, v_num=2, train_loss=0.00812, train_accuracy=1.000, val_loss=0.157, val_accuracy=0.954]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.19it/s][A
Epoch 164:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0498, v_num=2, train_loss=0.00812, train_accuracy=1.000, val_loss=0.157, val_accuracy=0.954]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.54it/s][A
Epoch 164:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0498, v_num=2, train_loss=0.00812, train_accuracy=1.000, val_loss=0.157, val_accuracy=0.954]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.72it/s][A
Epoch 164:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0498, v_num=2,

Epoch 164, global step 37289: val_loss was not in top 2


Epoch 165:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0342, v_num=2, train_loss=0.00128, train_accuracy=1.000, val_loss=0.151, val_accuracy=0.950]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 165:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0342, v_num=2, train_loss=0.00128, train_accuracy=1.000, val_loss=0.151, val_accuracy=0.950]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.19it/s][A
Epoch 165:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0342, v_num=2, train_loss=0.00128, train_accuracy=1.000, val_loss=0.151, val_accuracy=0.950]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.57it/s][A
Epoch 165:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0342, v_num=2, train_loss=0.00128, train_accuracy=1.000, val_loss=0.151, val_accuracy=0.950]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.74it/s][A
Epoch 165:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0342, v_num=2,

Epoch 165, global step 37515: val_loss was not in top 2


Epoch 166:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0442, v_num=2, train_loss=0.146, train_accuracy=0.944, val_loss=0.177, val_accuracy=0.952]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 166:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0442, v_num=2, train_loss=0.146, train_accuracy=0.944, val_loss=0.177, val_accuracy=0.952]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.22it/s][A
Epoch 166:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0442, v_num=2, train_loss=0.146, train_accuracy=0.944, val_loss=0.177, val_accuracy=0.952]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.56it/s][A
Epoch 166:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0442, v_num=2, train_loss=0.146, train_accuracy=0.944, val_loss=0.177, val_accuracy=0.952]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.78it/s][A
Epoch 166:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0442, v_num=2, train

Epoch 166, global step 37741: val_loss was not in top 2


Epoch 167:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0449, v_num=2, train_loss=0.153, train_accuracy=0.944, val_loss=0.170, val_accuracy=0.953]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 167:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0449, v_num=2, train_loss=0.153, train_accuracy=0.944, val_loss=0.170, val_accuracy=0.953]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.22it/s][A
Epoch 167:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0449, v_num=2, train_loss=0.153, train_accuracy=0.944, val_loss=0.170, val_accuracy=0.953]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.59it/s][A
Epoch 167:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0449, v_num=2, train_loss=0.153, train_accuracy=0.944, val_loss=0.170, val_accuracy=0.953]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.79it/s][A
Epoch 167:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0449, v_num=2, train

Epoch 167, global step 37967: val_loss reached 0.13596 (best 0.13596), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-33-v1.ckpt" as top 2


Epoch 168:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0624, v_num=2, train_loss=0.0149, train_accuracy=1.000, val_loss=0.136, val_accuracy=0.950] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 168:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0624, v_num=2, train_loss=0.0149, train_accuracy=1.000, val_loss=0.136, val_accuracy=0.950]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.20it/s][A
Epoch 168:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0624, v_num=2, train_loss=0.0149, train_accuracy=1.000, val_loss=0.136, val_accuracy=0.950]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.56it/s][A
Epoch 168:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0624, v_num=2, train_loss=0.0149, train_accuracy=1.000, val_loss=0.136, val_accuracy=0.950]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.73it/s][A
Epoch 168:  92%|█████████▏| 234/255 [02:37<00:14,  1.49it/s, loss=0.0624, v_num=2, tr

Epoch 168, global step 38193: val_loss was not in top 2


Epoch 169:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0695, v_num=2, train_loss=0.092, train_accuracy=0.944, val_loss=0.145, val_accuracy=0.949]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 169:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.0695, v_num=2, train_loss=0.092, train_accuracy=0.944, val_loss=0.145, val_accuracy=0.949]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.20it/s][A
Epoch 169:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0695, v_num=2, train_loss=0.092, train_accuracy=0.944, val_loss=0.145, val_accuracy=0.949]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.58it/s][A
Epoch 169:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0695, v_num=2, train_loss=0.092, train_accuracy=0.944, val_loss=0.145, val_accuracy=0.949]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.76it/s][A
Epoch 169:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0695, v_num=2, train

Epoch 169, global step 38419: val_loss was not in top 2


Epoch 170:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.063, v_num=2, train_loss=0.0175, train_accuracy=1.000, val_loss=0.146, val_accuracy=0.953]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 170:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.063, v_num=2, train_loss=0.0175, train_accuracy=1.000, val_loss=0.146, val_accuracy=0.953]
Validating:   7%|▋         | 2/29 [00:01<00:21,  1.23it/s][A
Epoch 170:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.063, v_num=2, train_loss=0.0175, train_accuracy=1.000, val_loss=0.146, val_accuracy=0.953]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.58it/s][A
Epoch 170:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.063, v_num=2, train_loss=0.0175, train_accuracy=1.000, val_loss=0.146, val_accuracy=0.953]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.74it/s][A
Epoch 170:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.063, v_num=2, train_

IOPub message rate exceeded.
The notebook server will temporarily stop sending output
to the client in order to avoid crashing it.
To change this limit, set the config variable
`--NotebookApp.iopub_msg_rate_limit`.

Current values:
NotebookApp.iopub_msg_rate_limit=1000.0 (msgs/sec)
NotebookApp.rate_limit_window=3.0 (secs)



Epoch 173:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.0376, v_num=2, train_loss=0.0115, train_accuracy=1.000, val_loss=0.131, val_accuracy=0.956]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 173:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.0376, v_num=2, train_loss=0.0115, train_accuracy=1.000, val_loss=0.131, val_accuracy=0.956]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.21it/s][A
Epoch 173:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0376, v_num=2, train_loss=0.0115, train_accuracy=1.000, val_loss=0.131, val_accuracy=0.956]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.57it/s][A
Epoch 173:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0376, v_num=2, train_loss=0.0115, train_accuracy=1.000, val_loss=0.131, val_accuracy=0.956]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.72it/s][A
Epoch 173:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0376, v_num=2, tra

Epoch 173, global step 39323: val_loss was not in top 2


Epoch 174:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0259, v_num=2, train_loss=0.00647, train_accuracy=1.000, val_loss=0.143, val_accuracy=0.957] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 174:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0259, v_num=2, train_loss=0.00647, train_accuracy=1.000, val_loss=0.143, val_accuracy=0.957]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.22it/s][A
Epoch 174:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0259, v_num=2, train_loss=0.00647, train_accuracy=1.000, val_loss=0.143, val_accuracy=0.957]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.59it/s][A
Epoch 174:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0259, v_num=2, train_loss=0.00647, train_accuracy=1.000, val_loss=0.143, val_accuracy=0.957]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.78it/s][A
Epoch 174:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0259, v_num=2

Epoch 174, global step 39549: val_loss was not in top 2


Epoch 175:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.0449, v_num=2, train_loss=0.00118, train_accuracy=1.000, val_loss=0.158, val_accuracy=0.957]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 175:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.0449, v_num=2, train_loss=0.00118, train_accuracy=1.000, val_loss=0.158, val_accuracy=0.957]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.22it/s][A
Epoch 175:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0449, v_num=2, train_loss=0.00118, train_accuracy=1.000, val_loss=0.158, val_accuracy=0.957]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.57it/s][A
Epoch 175:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0449, v_num=2, train_loss=0.00118, train_accuracy=1.000, val_loss=0.158, val_accuracy=0.957]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.80it/s][A
Epoch 175:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0449, v_num=2,

Epoch 175, global step 39775: val_loss was not in top 2


Epoch 176:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0407, v_num=2, train_loss=0.112, train_accuracy=0.944, val_loss=0.158, val_accuracy=0.952]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 176:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0407, v_num=2, train_loss=0.112, train_accuracy=0.944, val_loss=0.158, val_accuracy=0.952]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.18it/s][A
Epoch 176:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0407, v_num=2, train_loss=0.112, train_accuracy=0.944, val_loss=0.158, val_accuracy=0.952]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.53it/s][A
Epoch 176:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0407, v_num=2, train_loss=0.112, train_accuracy=0.944, val_loss=0.158, val_accuracy=0.952]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.77it/s][A
Epoch 176:  92%|█████████▏| 234/255 [02:37<00:14,  1.49it/s, loss=0.0407, v_num=2, trai

Epoch 176, global step 40001: val_loss was not in top 2


Epoch 177:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0354, v_num=2, train_loss=0.000302, train_accuracy=1.000, val_loss=0.173, val_accuracy=0.952]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 177:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0354, v_num=2, train_loss=0.000302, train_accuracy=1.000, val_loss=0.173, val_accuracy=0.952]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.20it/s][A
Epoch 177:  90%|█████████ | 230/255 [02:36<00:17,  1.46it/s, loss=0.0354, v_num=2, train_loss=0.000302, train_accuracy=1.000, val_loss=0.173, val_accuracy=0.952]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.53it/s][A
Epoch 177:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0354, v_num=2, train_loss=0.000302, train_accuracy=1.000, val_loss=0.173, val_accuracy=0.952]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.74it/s][A
Epoch 177:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0354, v_nu

Epoch 177, global step 40227: val_loss was not in top 2


Epoch 178:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0292, v_num=2, train_loss=0.00192, train_accuracy=1.000, val_loss=0.157, val_accuracy=0.952] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 178:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0292, v_num=2, train_loss=0.00192, train_accuracy=1.000, val_loss=0.157, val_accuracy=0.952]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.21it/s][A
Epoch 178:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0292, v_num=2, train_loss=0.00192, train_accuracy=1.000, val_loss=0.157, val_accuracy=0.952]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.59it/s][A
Epoch 178:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0292, v_num=2, train_loss=0.00192, train_accuracy=1.000, val_loss=0.157, val_accuracy=0.952]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.78it/s][A
Epoch 178:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0292, v_num=2

Epoch 178, global step 40453: val_loss was not in top 2


Epoch 179:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0315, v_num=2, train_loss=0.0211, train_accuracy=1.000, val_loss=0.156, val_accuracy=0.960] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 179:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.0315, v_num=2, train_loss=0.0211, train_accuracy=1.000, val_loss=0.156, val_accuracy=0.960]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.21it/s][A
Epoch 179:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0315, v_num=2, train_loss=0.0211, train_accuracy=1.000, val_loss=0.156, val_accuracy=0.960]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.58it/s][A
Epoch 179:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0315, v_num=2, train_loss=0.0211, train_accuracy=1.000, val_loss=0.156, val_accuracy=0.960]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.82it/s][A
Epoch 179:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0315, v_num=2, tr

Epoch 179, global step 40679: val_loss was not in top 2


Epoch 180:  42%|████▏     | 106/255 [01:13<01:42,  1.45it/s, loss=0.0297, v_num=2, train_loss=0.00168, train_accuracy=1.000, val_loss=0.133, val_accuracy=0.958]

IOPub message rate exceeded.
The notebook server will temporarily stop sending output
to the client in order to avoid crashing it.
To change this limit, set the config variable
`--NotebookApp.iopub_msg_rate_limit`.

Current values:
NotebookApp.iopub_msg_rate_limit=1000.0 (msgs/sec)
NotebookApp.rate_limit_window=3.0 (secs)




Validating:  48%|████▊     | 14/29 [00:03<00:02,  5.70it/s][A
Epoch 183:  95%|█████████▍| 242/255 [02:39<00:08,  1.52it/s, loss=0.0393, v_num=2, train_loss=0.000868, train_accuracy=1.000, val_loss=0.149, val_accuracy=0.962]
Validating:  55%|█████▌    | 16/29 [00:04<00:02,  5.80it/s][A
Epoch 183:  96%|█████████▌| 244/255 [02:39<00:07,  1.53it/s, loss=0.0393, v_num=2, train_loss=0.000868, train_accuracy=1.000, val_loss=0.149, val_accuracy=0.962]
Validating:  62%|██████▏   | 18/29 [00:04<00:01,  5.82it/s][A
Epoch 183:  96%|█████████▋| 246/255 [02:39<00:05,  1.54it/s, loss=0.0393, v_num=2, train_loss=0.000868, train_accuracy=1.000, val_loss=0.149, val_accuracy=0.962]
Validating:  69%|██████▉   | 20/29 [00:05<00:01,  5.81it/s][A
Epoch 183:  97%|█████████▋| 248/255 [02:40<00:04,  1.55it/s, loss=0.0393, v_num=2, train_loss=0.000868, train_accuracy=1.000, val_loss=0.149, val_accuracy=0.962]
Validating:  76%|███████▌  | 22/29 [00:05<00:01,  5.83it/s][A
Epoch 183:  98%|█████████▊| 250/255 

Epoch 183, global step 41583: val_loss was not in top 2


Epoch 184:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0551, v_num=2, train_loss=0.0791, train_accuracy=0.944, val_loss=0.142, val_accuracy=0.955]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 184:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0551, v_num=2, train_loss=0.0791, train_accuracy=0.944, val_loss=0.142, val_accuracy=0.955]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.21it/s][A
Epoch 184:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0551, v_num=2, train_loss=0.0791, train_accuracy=0.944, val_loss=0.142, val_accuracy=0.955]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.57it/s][A
Epoch 184:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0551, v_num=2, train_loss=0.0791, train_accuracy=0.944, val_loss=0.142, val_accuracy=0.955]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.70it/s][A
Epoch 184:  92%|█████████▏| 234/255 [02:37<00:14,  1.49it/s, loss=0.0551, v_num=2, t

Epoch 184, global step 41809: val_loss was not in top 2


Epoch 185:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0461, v_num=2, train_loss=0.211, train_accuracy=0.944, val_loss=0.174, val_accuracy=0.948]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 185:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0461, v_num=2, train_loss=0.211, train_accuracy=0.944, val_loss=0.174, val_accuracy=0.948]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.19it/s][A
Epoch 185:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0461, v_num=2, train_loss=0.211, train_accuracy=0.944, val_loss=0.174, val_accuracy=0.948]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.53it/s][A
Epoch 185:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0461, v_num=2, train_loss=0.211, train_accuracy=0.944, val_loss=0.174, val_accuracy=0.948]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.76it/s][A
Epoch 185:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0461, v_num=2, train

Epoch 185, global step 42035: val_loss reached 0.12758 (best 0.12758), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-33.ckpt" as top 2


Epoch 186:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.0514, v_num=2, train_loss=0.0787, train_accuracy=0.944, val_loss=0.128, val_accuracy=0.959] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 186:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.0514, v_num=2, train_loss=0.0787, train_accuracy=0.944, val_loss=0.128, val_accuracy=0.959]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.22it/s][A
Epoch 186:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0514, v_num=2, train_loss=0.0787, train_accuracy=0.944, val_loss=0.128, val_accuracy=0.959]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.56it/s][A
Epoch 186:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0514, v_num=2, train_loss=0.0787, train_accuracy=0.944, val_loss=0.128, val_accuracy=0.959]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.78it/s][A
Epoch 186:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0514, v_num=2, tr

Epoch 186, global step 42261: val_loss was not in top 2


Epoch 187:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.037, v_num=2, train_loss=0.00627, train_accuracy=1.000, val_loss=0.153, val_accuracy=0.957]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 187:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.037, v_num=2, train_loss=0.00627, train_accuracy=1.000, val_loss=0.153, val_accuracy=0.957]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.22it/s][A
Epoch 187:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.037, v_num=2, train_loss=0.00627, train_accuracy=1.000, val_loss=0.153, val_accuracy=0.957]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.56it/s][A
Epoch 187:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.037, v_num=2, train_loss=0.00627, train_accuracy=1.000, val_loss=0.153, val_accuracy=0.957]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.80it/s][A
Epoch 187:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.037, v_num=2, tr

Epoch 187, global step 42487: val_loss was not in top 2


Epoch 188:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.0205, v_num=2, train_loss=0.000648, train_accuracy=1.000, val_loss=0.163, val_accuracy=0.958]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 188:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.0205, v_num=2, train_loss=0.000648, train_accuracy=1.000, val_loss=0.163, val_accuracy=0.958]
Validating:   7%|▋         | 2/29 [00:01<00:22,  1.21it/s][A
Epoch 188:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0205, v_num=2, train_loss=0.000648, train_accuracy=1.000, val_loss=0.163, val_accuracy=0.958]
Validating:  14%|█▍        | 4/29 [00:02<00:09,  2.56it/s][A
Epoch 188:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0205, v_num=2, train_loss=0.000648, train_accuracy=1.000, val_loss=0.163, val_accuracy=0.958]
Validating:  21%|██        | 6/29 [00:02<00:06,  3.79it/s][A
Epoch 188:  92%|█████████▏| 234/255 [02:37<00:14,  1.48it/s, loss=0.0205, v_nu

Epoch 18, global step 4293: val_loss was not in top 2


Epoch 19:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.676, v_num=0, train_loss=0.702, train_accuracy=0.667, val_loss=0.682, val_accuracy=0.546]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 19:  89%|████████▉ | 228/255 [02:37<00:18,  1.44it/s, loss=0.676, v_num=0, train_loss=0.702, train_accuracy=0.667, val_loss=0.682, val_accuracy=0.546]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.08s/it][A
Epoch 19:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.676, v_num=0, train_loss=0.702, train_accuracy=0.667, val_loss=0.682, val_accuracy=0.546]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.13it/s][A
Epoch 19:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.676, v_num=0, train_loss=0.702, train_accuracy=0.667, val_loss=0.682, val_accuracy=0.546]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.29it/s][A
Epoch 19:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.676, v_num=0, train_loss=0.702,

Epoch 19, global step 4519: val_loss was not in top 2


Epoch 20:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.666, v_num=0, train_loss=0.652, train_accuracy=0.556, val_loss=0.675, val_accuracy=0.586]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 20:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.666, v_num=0, train_loss=0.652, train_accuracy=0.556, val_loss=0.675, val_accuracy=0.586]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.09s/it][A
Epoch 20:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.666, v_num=0, train_loss=0.652, train_accuracy=0.556, val_loss=0.675, val_accuracy=0.586]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.09it/s][A
Epoch 20:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.666, v_num=0, train_loss=0.652, train_accuracy=0.556, val_loss=0.675, val_accuracy=0.586]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.31it/s][A
Epoch 20:  92%|█████████▏| 234/255 [02:38<00:14,  1.48it/s, loss=0.666, v_num=0, train_loss=0.652,

Epoch 20, global step 4745: val_loss was not in top 2


Epoch 21:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.645, v_num=0, train_loss=0.737, train_accuracy=0.500, val_loss=0.675, val_accuracy=0.570]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 21:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.645, v_num=0, train_loss=0.737, train_accuracy=0.500, val_loss=0.675, val_accuracy=0.570]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.09s/it][A
Epoch 21:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.645, v_num=0, train_loss=0.737, train_accuracy=0.500, val_loss=0.675, val_accuracy=0.570]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.09it/s][A
Epoch 21:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.645, v_num=0, train_loss=0.737, train_accuracy=0.500, val_loss=0.675, val_accuracy=0.570]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.32it/s][A
Epoch 21:  92%|█████████▏| 234/255 [02:38<00:14,  1.48it/s, loss=0.645, v_num=0, train_loss=0.737,

Epoch 21, global step 4971: val_loss was not in top 2


Epoch 22:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.64, v_num=0, train_loss=0.664, train_accuracy=0.722, val_loss=0.641, val_accuracy=0.662] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 22:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.64, v_num=0, train_loss=0.664, train_accuracy=0.722, val_loss=0.641, val_accuracy=0.662]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.08s/it][A
Epoch 22:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.64, v_num=0, train_loss=0.664, train_accuracy=0.722, val_loss=0.641, val_accuracy=0.662]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.10it/s][A
Epoch 22:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.64, v_num=0, train_loss=0.664, train_accuracy=0.722, val_loss=0.641, val_accuracy=0.662]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.31it/s][A
Epoch 22:  92%|█████████▏| 234/255 [02:38<00:14,  1.48it/s, loss=0.64, v_num=0, train_loss=0.664, tra

Epoch 22, global step 5197: val_loss was not in top 2


Epoch 23:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.624, v_num=0, train_loss=0.633, train_accuracy=0.611, val_loss=0.642, val_accuracy=0.637]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 23:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.624, v_num=0, train_loss=0.633, train_accuracy=0.611, val_loss=0.642, val_accuracy=0.637]
Validating:   7%|▋         | 2/29 [00:02<00:30,  1.12s/it][A
Epoch 23:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.624, v_num=0, train_loss=0.633, train_accuracy=0.611, val_loss=0.642, val_accuracy=0.637]
Validating:  14%|█▍        | 4/29 [00:02<00:12,  2.06it/s][A
Epoch 23:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.624, v_num=0, train_loss=0.633, train_accuracy=0.611, val_loss=0.642, val_accuracy=0.637]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.30it/s][A
Epoch 23:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.624, v_num=0, train_loss=0.633,

Epoch 23, global step 5423: val_loss was not in top 2


Epoch 24:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.682, v_num=0, train_loss=0.698, train_accuracy=0.500, val_loss=0.622, val_accuracy=0.665]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 24:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.682, v_num=0, train_loss=0.698, train_accuracy=0.500, val_loss=0.622, val_accuracy=0.665]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.08s/it][A
Epoch 24:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.682, v_num=0, train_loss=0.698, train_accuracy=0.500, val_loss=0.622, val_accuracy=0.665]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.13it/s][A
Epoch 24:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.682, v_num=0, train_loss=0.698, train_accuracy=0.500, val_loss=0.622, val_accuracy=0.665]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.32it/s][A
Epoch 24:  92%|█████████▏| 234/255 [02:38<00:14,  1.48it/s, loss=0.682, v_num=0, train_loss=0.698,

Epoch 24, global step 5649: val_loss was not in top 2


Epoch 25:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.661, v_num=0, train_loss=0.651, train_accuracy=0.722, val_loss=0.677, val_accuracy=0.577]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 25:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.661, v_num=0, train_loss=0.651, train_accuracy=0.722, val_loss=0.677, val_accuracy=0.577]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.09s/it][A
Epoch 25:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.661, v_num=0, train_loss=0.651, train_accuracy=0.722, val_loss=0.677, val_accuracy=0.577]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.10it/s][A
Epoch 25:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.661, v_num=0, train_loss=0.651, train_accuracy=0.722, val_loss=0.677, val_accuracy=0.577]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.34it/s][A
Epoch 25:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.661, v_num=0, train_loss=0.651,

Epoch 25, global step 5875: val_loss was not in top 2


Epoch 26:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.652, v_num=0, train_loss=0.670, train_accuracy=0.611, val_loss=0.667, val_accuracy=0.594]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 26:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.652, v_num=0, train_loss=0.670, train_accuracy=0.611, val_loss=0.667, val_accuracy=0.594]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.08s/it][A
Epoch 26:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.652, v_num=0, train_loss=0.670, train_accuracy=0.611, val_loss=0.667, val_accuracy=0.594]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.13it/s][A
Epoch 26:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.652, v_num=0, train_loss=0.670, train_accuracy=0.611, val_loss=0.667, val_accuracy=0.594]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.37it/s][A
Epoch 26:  92%|█████████▏| 234/255 [02:38<00:14,  1.48it/s, loss=0.652, v_num=0, train_loss=0.670,

Epoch 26, global step 6101: val_loss was not in top 2


Epoch 27:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.667, v_num=0, train_loss=0.635, train_accuracy=0.667, val_loss=0.664, val_accuracy=0.601]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 27:  89%|████████▉ | 228/255 [02:37<00:18,  1.44it/s, loss=0.667, v_num=0, train_loss=0.635, train_accuracy=0.667, val_loss=0.664, val_accuracy=0.601]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.10s/it][A
Epoch 27:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.667, v_num=0, train_loss=0.635, train_accuracy=0.667, val_loss=0.664, val_accuracy=0.601]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.08it/s][A
Epoch 27:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.667, v_num=0, train_loss=0.635, train_accuracy=0.667, val_loss=0.664, val_accuracy=0.601]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.30it/s][A
Epoch 27:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.667, v_num=0, train_loss=0.635,

Epoch 27, global step 6327: val_loss was not in top 2


Epoch 28:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.66, v_num=0, train_loss=0.667, train_accuracy=0.500, val_loss=0.668, val_accuracy=0.576] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 28:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.66, v_num=0, train_loss=0.667, train_accuracy=0.500, val_loss=0.668, val_accuracy=0.576]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.09s/it][A
Epoch 28:  90%|█████████ | 230/255 [02:38<00:17,  1.46it/s, loss=0.66, v_num=0, train_loss=0.667, train_accuracy=0.500, val_loss=0.668, val_accuracy=0.576]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.11it/s][A
Epoch 28:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.66, v_num=0, train_loss=0.667, train_accuracy=0.500, val_loss=0.668, val_accuracy=0.576]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.34it/s][A
Epoch 28:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.66, v_num=0, train_loss=0.667, tra

Epoch 28, global step 6553: val_loss was not in top 2


Epoch 29:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.626, v_num=0, train_loss=0.622, train_accuracy=0.667, val_loss=0.659, val_accuracy=0.598]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 29:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.626, v_num=0, train_loss=0.622, train_accuracy=0.667, val_loss=0.659, val_accuracy=0.598]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.08s/it][A
Epoch 29:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.626, v_num=0, train_loss=0.622, train_accuracy=0.667, val_loss=0.659, val_accuracy=0.598]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.10it/s][A
Epoch 29:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.626, v_num=0, train_loss=0.622, train_accuracy=0.667, val_loss=0.659, val_accuracy=0.598]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.34it/s][A
Epoch 29:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.626, v_num=0, train_loss=0.622,

Epoch 29, global step 6779: val_loss was not in top 2


Epoch 30:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.653, v_num=0, train_loss=0.721, train_accuracy=0.556, val_loss=0.625, val_accuracy=0.637]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 30:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.653, v_num=0, train_loss=0.721, train_accuracy=0.556, val_loss=0.625, val_accuracy=0.637]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.16s/it][A
Epoch 30:  90%|█████████ | 230/255 [02:38<00:17,  1.46it/s, loss=0.653, v_num=0, train_loss=0.721, train_accuracy=0.556, val_loss=0.625, val_accuracy=0.637]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  2.02it/s][A
Epoch 30:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.653, v_num=0, train_loss=0.721, train_accuracy=0.556, val_loss=0.625, val_accuracy=0.637]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.22it/s][A
Epoch 30:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.653, v_num=0, train_loss=0.721,

Epoch 30, global step 7005: val_loss was not in top 2


Epoch 31:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.671, v_num=0, train_loss=0.654, train_accuracy=0.611, val_loss=0.645, val_accuracy=0.624]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 31:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.671, v_num=0, train_loss=0.654, train_accuracy=0.611, val_loss=0.645, val_accuracy=0.624]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.10s/it][A
Epoch 31:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.671, v_num=0, train_loss=0.654, train_accuracy=0.611, val_loss=0.645, val_accuracy=0.624]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.10it/s][A
Epoch 31:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.671, v_num=0, train_loss=0.654, train_accuracy=0.611, val_loss=0.645, val_accuracy=0.624]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.25it/s][A
Epoch 31:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.671, v_num=0, train_loss=0.654,

Epoch 31, global step 7231: val_loss was not in top 2


Epoch 32:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.616, v_num=0, train_loss=0.504, train_accuracy=0.778, val_loss=0.668, val_accuracy=0.550]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 32:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.616, v_num=0, train_loss=0.504, train_accuracy=0.778, val_loss=0.668, val_accuracy=0.550]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.08s/it][A
Epoch 32:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.616, v_num=0, train_loss=0.504, train_accuracy=0.778, val_loss=0.668, val_accuracy=0.550]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.12it/s][A
Epoch 32:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.616, v_num=0, train_loss=0.504, train_accuracy=0.778, val_loss=0.668, val_accuracy=0.550]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.29it/s][A
Epoch 32:  92%|█████████▏| 234/255 [02:38<00:14,  1.48it/s, loss=0.616, v_num=0, train_loss=0.504,

Epoch 32, global step 7457: val_loss was not in top 2


Epoch 33:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.596, v_num=0, train_loss=0.642, train_accuracy=0.667, val_loss=0.619, val_accuracy=0.652]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 33:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.596, v_num=0, train_loss=0.642, train_accuracy=0.667, val_loss=0.619, val_accuracy=0.652]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.09s/it][A
Epoch 33:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.596, v_num=0, train_loss=0.642, train_accuracy=0.667, val_loss=0.619, val_accuracy=0.652]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.10it/s][A
Epoch 33:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.596, v_num=0, train_loss=0.642, train_accuracy=0.667, val_loss=0.619, val_accuracy=0.652]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.29it/s][A
Epoch 33:  92%|█████████▏| 234/255 [02:38<00:14,  1.48it/s, loss=0.596, v_num=0, train_loss=0.642,

Epoch 33, global step 7683: val_loss reached 0.60548 (best 0.60548), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34.ckpt" as top 2


Epoch 51:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.37, v_num=0, train_loss=0.472, train_accuracy=0.833, val_loss=0.468, val_accuracy=0.770] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 51:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.37, v_num=0, train_loss=0.472, train_accuracy=0.833, val_loss=0.468, val_accuracy=0.770]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.09s/it][A
Epoch 51:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.37, v_num=0, train_loss=0.472, train_accuracy=0.833, val_loss=0.468, val_accuracy=0.770]
Validating:  14%|█▍        | 4/29 [00:02<00:12,  2.08it/s][A
Epoch 51:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.37, v_num=0, train_loss=0.472, train_accuracy=0.833, val_loss=0.468, val_accuracy=0.770]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.31it/s][A
Epoch 51:  92%|█████████▏| 234/255 [02:38<00:14,  1.48it/s, loss=0.37, v_num=0, train_loss=0.472, tra

Epoch 51, global step 11751: val_loss reached 0.47004 (best 0.46785), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34-v1.ckpt" as top 2


Epoch 52:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.495, v_num=0, train_loss=0.406, train_accuracy=0.722, val_loss=0.470, val_accuracy=0.779]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 52:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.495, v_num=0, train_loss=0.406, train_accuracy=0.722, val_loss=0.470, val_accuracy=0.779]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.09s/it][A
Epoch 52:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.495, v_num=0, train_loss=0.406, train_accuracy=0.722, val_loss=0.470, val_accuracy=0.779]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.11it/s][A
Epoch 52:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.495, v_num=0, train_loss=0.406, train_accuracy=0.722, val_loss=0.470, val_accuracy=0.779]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.34it/s][A
Epoch 52:  92%|█████████▏| 234/255 [02:38<00:14,  1.48it/s, loss=0.495, v_num=0, train_loss=0.406,

Epoch 52, global step 11977: val_loss was not in top 2


Epoch 53:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.4, v_num=0, train_loss=0.386, train_accuracy=0.778, val_loss=0.505, val_accuracy=0.755]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 53:  89%|████████▉ | 228/255 [02:37<00:18,  1.44it/s, loss=0.4, v_num=0, train_loss=0.386, train_accuracy=0.778, val_loss=0.505, val_accuracy=0.755]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.09s/it][A
Epoch 53:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.4, v_num=0, train_loss=0.386, train_accuracy=0.778, val_loss=0.505, val_accuracy=0.755]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.11it/s][A
Epoch 53:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.4, v_num=0, train_loss=0.386, train_accuracy=0.778, val_loss=0.505, val_accuracy=0.755]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.31it/s][A
Epoch 53:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.4, v_num=0, train_loss=0.386, train_a

Epoch 53, global step 12203: val_loss reached 0.45214 (best 0.45214), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34-v1.ckpt" as top 2


Epoch 54:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.411, v_num=0, train_loss=0.368, train_accuracy=0.778, val_loss=0.452, val_accuracy=0.778]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 54:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.411, v_num=0, train_loss=0.368, train_accuracy=0.778, val_loss=0.452, val_accuracy=0.778]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.09s/it][A
Epoch 54:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.411, v_num=0, train_loss=0.368, train_accuracy=0.778, val_loss=0.452, val_accuracy=0.778]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.09it/s][A
Epoch 54:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.411, v_num=0, train_loss=0.368, train_accuracy=0.778, val_loss=0.452, val_accuracy=0.778]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.32it/s][A
Epoch 54:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.411, v_num=0, train_loss=0.368,

Epoch 54, global step 12429: val_loss reached 0.46224 (best 0.45214), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34.ckpt" as top 2


Epoch 55:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.411, v_num=0, train_loss=0.466, train_accuracy=0.833, val_loss=0.462, val_accuracy=0.771]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 55:  89%|████████▉ | 228/255 [02:37<00:18,  1.44it/s, loss=0.411, v_num=0, train_loss=0.466, train_accuracy=0.833, val_loss=0.462, val_accuracy=0.771]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.10s/it][A
Epoch 55:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.411, v_num=0, train_loss=0.466, train_accuracy=0.833, val_loss=0.462, val_accuracy=0.771]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.10it/s][A
Epoch 55:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.411, v_num=0, train_loss=0.466, train_accuracy=0.833, val_loss=0.462, val_accuracy=0.771]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.34it/s][A
Epoch 55:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.411, v_num=0, train_loss=0.466,

Epoch 55, global step 12655: val_loss reached 0.45565 (best 0.45214), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34.ckpt" as top 2


Epoch 56:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.457, v_num=0, train_loss=0.234, train_accuracy=0.944, val_loss=0.456, val_accuracy=0.790]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 56:  89%|████████▉ | 228/255 [02:38<00:18,  1.44it/s, loss=0.457, v_num=0, train_loss=0.234, train_accuracy=0.944, val_loss=0.456, val_accuracy=0.790]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.16s/it][A
Epoch 56:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.457, v_num=0, train_loss=0.234, train_accuracy=0.944, val_loss=0.456, val_accuracy=0.790]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  2.02it/s][A
Epoch 56:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.457, v_num=0, train_loss=0.234, train_accuracy=0.944, val_loss=0.456, val_accuracy=0.790]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.24it/s][A
Epoch 56:  92%|█████████▏| 234/255 [02:39<00:14,  1.47it/s, loss=0.457, v_num=0, train_loss=0.234,

Epoch 56, global step 12881: val_loss was not in top 2


Epoch 57:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.41, v_num=0, train_loss=0.165, train_accuracy=1.000, val_loss=0.515, val_accuracy=0.762] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 57:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.41, v_num=0, train_loss=0.165, train_accuracy=1.000, val_loss=0.515, val_accuracy=0.762]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.11s/it][A
Epoch 57:  90%|█████████ | 230/255 [02:38<00:17,  1.46it/s, loss=0.41, v_num=0, train_loss=0.165, train_accuracy=1.000, val_loss=0.515, val_accuracy=0.762]
Validating:  14%|█▍        | 4/29 [00:02<00:12,  2.08it/s][A
Epoch 57:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.41, v_num=0, train_loss=0.165, train_accuracy=1.000, val_loss=0.515, val_accuracy=0.762]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.27it/s][A
Epoch 57:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.41, v_num=0, train_loss=0.165, tra

Epoch 57, global step 13107: val_loss reached 0.42900 (best 0.42900), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34.ckpt" as top 2


Epoch 58:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.412, v_num=0, train_loss=0.419, train_accuracy=0.722, val_loss=0.429, val_accuracy=0.796]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 58:  89%|████████▉ | 228/255 [02:37<00:18,  1.44it/s, loss=0.412, v_num=0, train_loss=0.419, train_accuracy=0.722, val_loss=0.429, val_accuracy=0.796]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.10s/it][A
Epoch 58:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.412, v_num=0, train_loss=0.419, train_accuracy=0.722, val_loss=0.429, val_accuracy=0.796]
Validating:  14%|█▍        | 4/29 [00:02<00:12,  2.08it/s][A
Epoch 58:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.412, v_num=0, train_loss=0.419, train_accuracy=0.722, val_loss=0.429, val_accuracy=0.796]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.30it/s][A
Epoch 58:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.412, v_num=0, train_loss=0.419,

Epoch 58, global step 13333: val_loss reached 0.42377 (best 0.42377), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34-v1.ckpt" as top 2


Epoch 59:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.395, v_num=0, train_loss=0.349, train_accuracy=0.833, val_loss=0.424, val_accuracy=0.801]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 59:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.395, v_num=0, train_loss=0.349, train_accuracy=0.833, val_loss=0.424, val_accuracy=0.801]
Validating:   7%|▋         | 2/29 [00:02<00:28,  1.07s/it][A
Epoch 59:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.395, v_num=0, train_loss=0.349, train_accuracy=0.833, val_loss=0.424, val_accuracy=0.801]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.12it/s][A
Epoch 59:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.395, v_num=0, train_loss=0.349, train_accuracy=0.833, val_loss=0.424, val_accuracy=0.801]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.37it/s][A
Epoch 59:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.395, v_num=0, train_loss=0.349,

Epoch 59, global step 13559: val_loss was not in top 2


Epoch 60:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.38, v_num=0, train_loss=0.390, train_accuracy=0.833, val_loss=0.437, val_accuracy=0.776] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 60:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.38, v_num=0, train_loss=0.390, train_accuracy=0.833, val_loss=0.437, val_accuracy=0.776]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.09s/it][A
Epoch 60:  90%|█████████ | 230/255 [02:38<00:17,  1.46it/s, loss=0.38, v_num=0, train_loss=0.390, train_accuracy=0.833, val_loss=0.437, val_accuracy=0.776]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.10it/s][A
Epoch 60:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.38, v_num=0, train_loss=0.390, train_accuracy=0.833, val_loss=0.437, val_accuracy=0.776]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.31it/s][A
Epoch 60:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.38, v_num=0, train_loss=0.390, tra

Epoch 60, global step 13785: val_loss reached 0.42654 (best 0.42377), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34.ckpt" as top 2


Epoch 61:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.361, v_num=0, train_loss=0.133, train_accuracy=1.000, val_loss=0.427, val_accuracy=0.791]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 61:  89%|████████▉ | 228/255 [02:37<00:18,  1.44it/s, loss=0.361, v_num=0, train_loss=0.133, train_accuracy=1.000, val_loss=0.427, val_accuracy=0.791]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.10s/it][A
Epoch 61:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.361, v_num=0, train_loss=0.133, train_accuracy=1.000, val_loss=0.427, val_accuracy=0.791]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.09it/s][A
Epoch 61:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.361, v_num=0, train_loss=0.133, train_accuracy=1.000, val_loss=0.427, val_accuracy=0.791]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.31it/s][A
Epoch 61:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.361, v_num=0, train_loss=0.133,

Epoch 61, global step 14011: val_loss reached 0.42018 (best 0.42018), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34.ckpt" as top 2


Epoch 62:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.44, v_num=0, train_loss=0.606, train_accuracy=0.778, val_loss=0.420, val_accuracy=0.796] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 62:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.44, v_num=0, train_loss=0.606, train_accuracy=0.778, val_loss=0.420, val_accuracy=0.796]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.11s/it][A
Epoch 62:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.44, v_num=0, train_loss=0.606, train_accuracy=0.778, val_loss=0.420, val_accuracy=0.796]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.09it/s][A
Epoch 62:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.44, v_num=0, train_loss=0.606, train_accuracy=0.778, val_loss=0.420, val_accuracy=0.796]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.28it/s][A
Epoch 62:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.44, v_num=0, train_loss=0.606, tra

Epoch 62, global step 14237: val_loss was not in top 2


Epoch 63:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.454, v_num=0, train_loss=0.704, train_accuracy=0.667, val_loss=0.765, val_accuracy=0.713]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 63:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.454, v_num=0, train_loss=0.704, train_accuracy=0.667, val_loss=0.765, val_accuracy=0.713]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.09s/it][A
Epoch 63:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.454, v_num=0, train_loss=0.704, train_accuracy=0.667, val_loss=0.765, val_accuracy=0.713]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.10it/s][A
Epoch 63:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.454, v_num=0, train_loss=0.704, train_accuracy=0.667, val_loss=0.765, val_accuracy=0.713]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.34it/s][A
Epoch 63:  92%|█████████▏| 234/255 [02:38<00:14,  1.48it/s, loss=0.454, v_num=0, train_loss=0.704,

Epoch 63, global step 14463: val_loss was not in top 2


Epoch 64:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.419, v_num=0, train_loss=0.537, train_accuracy=0.778, val_loss=0.435, val_accuracy=0.789]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 64:  89%|████████▉ | 228/255 [02:37<00:18,  1.44it/s, loss=0.419, v_num=0, train_loss=0.537, train_accuracy=0.778, val_loss=0.435, val_accuracy=0.789]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.10s/it][A
Epoch 64:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.419, v_num=0, train_loss=0.537, train_accuracy=0.778, val_loss=0.435, val_accuracy=0.789]
Validating:  14%|█▍        | 4/29 [00:02<00:12,  2.07it/s][A
Epoch 64:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.419, v_num=0, train_loss=0.537, train_accuracy=0.778, val_loss=0.435, val_accuracy=0.789]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.27it/s][A
Epoch 64:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.419, v_num=0, train_loss=0.537,

Epoch 64, global step 14689: val_loss was not in top 2


Epoch 65:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.412, v_num=0, train_loss=0.305, train_accuracy=0.889, val_loss=0.439, val_accuracy=0.769]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 65:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.412, v_num=0, train_loss=0.305, train_accuracy=0.889, val_loss=0.439, val_accuracy=0.769]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.09s/it][A
Epoch 65:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.412, v_num=0, train_loss=0.305, train_accuracy=0.889, val_loss=0.439, val_accuracy=0.769]
Validating:  14%|█▍        | 4/29 [00:02<00:12,  2.08it/s][A
Epoch 65:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.412, v_num=0, train_loss=0.305, train_accuracy=0.889, val_loss=0.439, val_accuracy=0.769]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.32it/s][A
Epoch 65:  92%|█████████▏| 234/255 [02:38<00:14,  1.48it/s, loss=0.412, v_num=0, train_loss=0.305,

Epoch 65, global step 14915: val_loss reached 0.40238 (best 0.40238), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34-v1.ckpt" as top 2


Epoch 66:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.372, v_num=0, train_loss=0.470, train_accuracy=0.833, val_loss=0.402, val_accuracy=0.806]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 66:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.372, v_num=0, train_loss=0.470, train_accuracy=0.833, val_loss=0.402, val_accuracy=0.806]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.10s/it][A
Epoch 66:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.372, v_num=0, train_loss=0.470, train_accuracy=0.833, val_loss=0.402, val_accuracy=0.806]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.11it/s][A
Epoch 66:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.372, v_num=0, train_loss=0.470, train_accuracy=0.833, val_loss=0.402, val_accuracy=0.806]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.23it/s][A
Epoch 66:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.372, v_num=0, train_loss=0.470,

Epoch 66, global step 15141: val_loss reached 0.40063 (best 0.40063), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34.ckpt" as top 2


Epoch 67:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.398, v_num=0, train_loss=0.330, train_accuracy=0.889, val_loss=0.401, val_accuracy=0.803]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 67:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.398, v_num=0, train_loss=0.330, train_accuracy=0.889, val_loss=0.401, val_accuracy=0.803]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.10s/it][A
Epoch 67:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.398, v_num=0, train_loss=0.330, train_accuracy=0.889, val_loss=0.401, val_accuracy=0.803]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.09it/s][A
Epoch 67:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.398, v_num=0, train_loss=0.330, train_accuracy=0.889, val_loss=0.401, val_accuracy=0.803]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.31it/s][A
Epoch 67:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.398, v_num=0, train_loss=0.330,

Epoch 67, global step 15367: val_loss was not in top 2


Epoch 68:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.39, v_num=0, train_loss=0.405, train_accuracy=0.889, val_loss=0.412, val_accuracy=0.797] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 68:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.39, v_num=0, train_loss=0.405, train_accuracy=0.889, val_loss=0.412, val_accuracy=0.797]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.10s/it][A
Epoch 68:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.39, v_num=0, train_loss=0.405, train_accuracy=0.889, val_loss=0.412, val_accuracy=0.797]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.11it/s][A
Epoch 68:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.39, v_num=0, train_loss=0.405, train_accuracy=0.889, val_loss=0.412, val_accuracy=0.797]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.33it/s][A
Epoch 68:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.39, v_num=0, train_loss=0.405, tra

Epoch 68, global step 15593: val_loss reached 0.40235 (best 0.40063), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34-v1.ckpt" as top 2


Epoch 69:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.355, v_num=0, train_loss=0.391, train_accuracy=0.667, val_loss=0.402, val_accuracy=0.804]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 69:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.355, v_num=0, train_loss=0.391, train_accuracy=0.667, val_loss=0.402, val_accuracy=0.804]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.10s/it][A
Epoch 69:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.355, v_num=0, train_loss=0.391, train_accuracy=0.667, val_loss=0.402, val_accuracy=0.804]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.10it/s][A
Epoch 69:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.355, v_num=0, train_loss=0.391, train_accuracy=0.667, val_loss=0.402, val_accuracy=0.804]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.34it/s][A
Epoch 69:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.355, v_num=0, train_loss=0.391,

Epoch 69, global step 15819: val_loss was not in top 2


Epoch 70:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.379, v_num=0, train_loss=0.374, train_accuracy=0.889, val_loss=0.415, val_accuracy=0.795]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 70:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.379, v_num=0, train_loss=0.374, train_accuracy=0.889, val_loss=0.415, val_accuracy=0.795]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.11s/it][A
Epoch 70:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.379, v_num=0, train_loss=0.374, train_accuracy=0.889, val_loss=0.415, val_accuracy=0.795]
Validating:  14%|█▍        | 4/29 [00:02<00:12,  2.06it/s][A
Epoch 70:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.379, v_num=0, train_loss=0.374, train_accuracy=0.889, val_loss=0.415, val_accuracy=0.795]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.26it/s][A
Epoch 70:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.379, v_num=0, train_loss=0.374,

Epoch 70, global step 16045: val_loss was not in top 2


Epoch 71:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.379, v_num=0, train_loss=0.312, train_accuracy=0.833, val_loss=0.435, val_accuracy=0.799]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 71:  89%|████████▉ | 228/255 [02:37<00:18,  1.44it/s, loss=0.379, v_num=0, train_loss=0.312, train_accuracy=0.833, val_loss=0.435, val_accuracy=0.799]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.09s/it][A
Epoch 71:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.379, v_num=0, train_loss=0.312, train_accuracy=0.833, val_loss=0.435, val_accuracy=0.799]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.08it/s][A
Epoch 71:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.379, v_num=0, train_loss=0.312, train_accuracy=0.833, val_loss=0.435, val_accuracy=0.799]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.31it/s][A
Epoch 71:  92%|█████████▏| 234/255 [02:39<00:14,  1.47it/s, loss=0.379, v_num=0, train_loss=0.312,

Epoch 71, global step 16271: val_loss was not in top 2


Epoch 72:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.338, v_num=0, train_loss=0.389, train_accuracy=0.722, val_loss=0.405, val_accuracy=0.796]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 72:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.338, v_num=0, train_loss=0.389, train_accuracy=0.722, val_loss=0.405, val_accuracy=0.796]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.09s/it][A
Epoch 72:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.338, v_num=0, train_loss=0.389, train_accuracy=0.722, val_loss=0.405, val_accuracy=0.796]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.10it/s][A
Epoch 72:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.338, v_num=0, train_loss=0.389, train_accuracy=0.722, val_loss=0.405, val_accuracy=0.796]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.31it/s][A
Epoch 72:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.338, v_num=0, train_loss=0.389,

Epoch 72, global step 16497: val_loss reached 0.39828 (best 0.39828), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34-v1.ckpt" as top 2


Epoch 73:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.419, v_num=0, train_loss=0.380, train_accuracy=0.889, val_loss=0.398, val_accuracy=0.805]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 73:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.419, v_num=0, train_loss=0.380, train_accuracy=0.889, val_loss=0.398, val_accuracy=0.805]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.11s/it][A
Epoch 73:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.419, v_num=0, train_loss=0.380, train_accuracy=0.889, val_loss=0.398, val_accuracy=0.805]
Validating:  14%|█▍        | 4/29 [00:02<00:12,  2.06it/s][A
Epoch 73:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.419, v_num=0, train_loss=0.380, train_accuracy=0.889, val_loss=0.398, val_accuracy=0.805]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.31it/s][A
Epoch 73:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.419, v_num=0, train_loss=0.380,

Epoch 73, global step 16723: val_loss was not in top 2


Epoch 74:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.358, v_num=0, train_loss=0.274, train_accuracy=0.833, val_loss=0.469, val_accuracy=0.789]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 74:  89%|████████▉ | 228/255 [02:37<00:18,  1.44it/s, loss=0.358, v_num=0, train_loss=0.274, train_accuracy=0.833, val_loss=0.469, val_accuracy=0.789]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.09s/it][A
Epoch 74:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.358, v_num=0, train_loss=0.274, train_accuracy=0.833, val_loss=0.469, val_accuracy=0.789]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.11it/s][A
Epoch 74:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.358, v_num=0, train_loss=0.274, train_accuracy=0.833, val_loss=0.469, val_accuracy=0.789]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.29it/s][A
Epoch 74:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.358, v_num=0, train_loss=0.274,

Epoch 74, global step 16949: val_loss was not in top 2


Epoch 75:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.368, v_num=0, train_loss=0.286, train_accuracy=0.889, val_loss=0.438, val_accuracy=0.792]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 75:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.368, v_num=0, train_loss=0.286, train_accuracy=0.889, val_loss=0.438, val_accuracy=0.792]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.10s/it][A
Epoch 75:  90%|█████████ | 230/255 [02:38<00:17,  1.46it/s, loss=0.368, v_num=0, train_loss=0.286, train_accuracy=0.889, val_loss=0.438, val_accuracy=0.792]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.10it/s][A
Epoch 75:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.368, v_num=0, train_loss=0.286, train_accuracy=0.889, val_loss=0.438, val_accuracy=0.792]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.33it/s][A
Epoch 75:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.368, v_num=0, train_loss=0.286,

Epoch 75, global step 17175: val_loss was not in top 2


Epoch 76:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.375, v_num=0, train_loss=0.273, train_accuracy=0.889, val_loss=0.443, val_accuracy=0.800]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 76:  89%|████████▉ | 228/255 [02:37<00:18,  1.44it/s, loss=0.375, v_num=0, train_loss=0.273, train_accuracy=0.889, val_loss=0.443, val_accuracy=0.800]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.10s/it][A
Epoch 76:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.375, v_num=0, train_loss=0.273, train_accuracy=0.889, val_loss=0.443, val_accuracy=0.800]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.09it/s][A
Epoch 76:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.375, v_num=0, train_loss=0.273, train_accuracy=0.889, val_loss=0.443, val_accuracy=0.800]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.29it/s][A
Epoch 76:  92%|█████████▏| 234/255 [02:39<00:14,  1.47it/s, loss=0.375, v_num=0, train_loss=0.273,

Epoch 76, global step 17401: val_loss was not in top 2


Epoch 77:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.362, v_num=0, train_loss=0.482, train_accuracy=0.722, val_loss=0.433, val_accuracy=0.791]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 77:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.362, v_num=0, train_loss=0.482, train_accuracy=0.722, val_loss=0.433, val_accuracy=0.791]
Validating:   7%|▋         | 2/29 [00:02<00:30,  1.11s/it][A
Epoch 77:  90%|█████████ | 230/255 [02:38<00:17,  1.46it/s, loss=0.362, v_num=0, train_loss=0.482, train_accuracy=0.722, val_loss=0.433, val_accuracy=0.791]
Validating:  14%|█▍        | 4/29 [00:02<00:12,  2.06it/s][A
Epoch 77:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.362, v_num=0, train_loss=0.482, train_accuracy=0.722, val_loss=0.433, val_accuracy=0.791]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.30it/s][A
Epoch 77:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.362, v_num=0, train_loss=0.482,

Epoch 77, global step 17627: val_loss was not in top 2


Epoch 78:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.359, v_num=0, train_loss=0.221, train_accuracy=0.944, val_loss=0.421, val_accuracy=0.808]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 78:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.359, v_num=0, train_loss=0.221, train_accuracy=0.944, val_loss=0.421, val_accuracy=0.808]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.16s/it][A
Epoch 78:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.359, v_num=0, train_loss=0.221, train_accuracy=0.944, val_loss=0.421, val_accuracy=0.808]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  2.00it/s][A
Epoch 78:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.359, v_num=0, train_loss=0.221, train_accuracy=0.944, val_loss=0.421, val_accuracy=0.808]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.18it/s][A
Epoch 78:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.359, v_num=0, train_loss=0.221,

Epoch 78, global step 17853: val_loss was not in top 2


Epoch 79:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.352, v_num=0, train_loss=0.403, train_accuracy=0.722, val_loss=0.423, val_accuracy=0.808]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 79:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.352, v_num=0, train_loss=0.403, train_accuracy=0.722, val_loss=0.423, val_accuracy=0.808]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.16s/it][A
Epoch 79:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.352, v_num=0, train_loss=0.403, train_accuracy=0.722, val_loss=0.423, val_accuracy=0.808]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  2.01it/s][A
Epoch 79:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.352, v_num=0, train_loss=0.403, train_accuracy=0.722, val_loss=0.423, val_accuracy=0.808]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.20it/s][A
Epoch 79:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.352, v_num=0, train_loss=0.403,

Epoch 79, global step 18079: val_loss reached 0.40035 (best 0.39828), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34.ckpt" as top 2


Epoch 80:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.359, v_num=0, train_loss=0.371, train_accuracy=0.778, val_loss=0.400, val_accuracy=0.801]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 80:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.359, v_num=0, train_loss=0.371, train_accuracy=0.778, val_loss=0.400, val_accuracy=0.801]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.10s/it][A
Epoch 80:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.359, v_num=0, train_loss=0.371, train_accuracy=0.778, val_loss=0.400, val_accuracy=0.801]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.10it/s][A
Epoch 80:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.359, v_num=0, train_loss=0.371, train_accuracy=0.778, val_loss=0.400, val_accuracy=0.801]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.28it/s][A
Epoch 80:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.359, v_num=0, train_loss=0.371,

Epoch 80, global step 18305: val_loss reached 0.38358 (best 0.38358), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34.ckpt" as top 2


Epoch 81:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.349, v_num=0, train_loss=0.317, train_accuracy=0.778, val_loss=0.384, val_accuracy=0.812]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 81:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.349, v_num=0, train_loss=0.317, train_accuracy=0.778, val_loss=0.384, val_accuracy=0.812]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.10s/it][A
Epoch 81:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.349, v_num=0, train_loss=0.317, train_accuracy=0.778, val_loss=0.384, val_accuracy=0.812]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.09it/s][A
Epoch 81:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.349, v_num=0, train_loss=0.317, train_accuracy=0.778, val_loss=0.384, val_accuracy=0.812]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.30it/s][A
Epoch 81:  92%|█████████▏| 234/255 [02:38<00:14,  1.48it/s, loss=0.349, v_num=0, train_loss=0.317,

Epoch 81, global step 18531: val_loss reached 0.38462 (best 0.38358), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34-v1.ckpt" as top 2


Epoch 82:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.326, v_num=0, train_loss=0.291, train_accuracy=0.778, val_loss=0.385, val_accuracy=0.823]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 82:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.326, v_num=0, train_loss=0.291, train_accuracy=0.778, val_loss=0.385, val_accuracy=0.823]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.10s/it][A
Epoch 82:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.326, v_num=0, train_loss=0.291, train_accuracy=0.778, val_loss=0.385, val_accuracy=0.823]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.09it/s][A
Epoch 82:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.326, v_num=0, train_loss=0.291, train_accuracy=0.778, val_loss=0.385, val_accuracy=0.823]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.23it/s][A
Epoch 82:  92%|█████████▏| 234/255 [02:38<00:14,  1.48it/s, loss=0.326, v_num=0, train_loss=0.291,

Epoch 82, global step 18757: val_loss was not in top 2


Epoch 83:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.339, v_num=0, train_loss=0.197, train_accuracy=0.889, val_loss=0.400, val_accuracy=0.815]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 83:  89%|████████▉ | 228/255 [02:37<00:18,  1.44it/s, loss=0.339, v_num=0, train_loss=0.197, train_accuracy=0.889, val_loss=0.400, val_accuracy=0.815]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.11s/it][A
Epoch 83:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.339, v_num=0, train_loss=0.197, train_accuracy=0.889, val_loss=0.400, val_accuracy=0.815]
Validating:  14%|█▍        | 4/29 [00:02<00:12,  2.06it/s][A
Epoch 83:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.339, v_num=0, train_loss=0.197, train_accuracy=0.889, val_loss=0.400, val_accuracy=0.815]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.26it/s][A
Epoch 83:  92%|█████████▏| 234/255 [02:39<00:14,  1.47it/s, loss=0.339, v_num=0, train_loss=0.197,

Epoch 83, global step 18983: val_loss reached 0.35767 (best 0.35767), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34-v1.ckpt" as top 2


Epoch 84:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.342, v_num=0, train_loss=0.189, train_accuracy=1.000, val_loss=0.358, val_accuracy=0.825]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 84:  89%|████████▉ | 228/255 [02:38<00:18,  1.44it/s, loss=0.342, v_num=0, train_loss=0.189, train_accuracy=1.000, val_loss=0.358, val_accuracy=0.825]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.09s/it][A
Epoch 84:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.342, v_num=0, train_loss=0.189, train_accuracy=1.000, val_loss=0.358, val_accuracy=0.825]
Validating:  14%|█▍        | 4/29 [00:02<00:12,  2.07it/s][A
Epoch 84:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.342, v_num=0, train_loss=0.189, train_accuracy=1.000, val_loss=0.358, val_accuracy=0.825]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.30it/s][A
Epoch 84:  92%|█████████▏| 234/255 [02:39<00:14,  1.47it/s, loss=0.342, v_num=0, train_loss=0.189,

Epoch 84, global step 19209: val_loss reached 0.35689 (best 0.35689), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34.ckpt" as top 2


Epoch 85:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.353, v_num=0, train_loss=0.286, train_accuracy=0.833, val_loss=0.357, val_accuracy=0.830]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 85:  89%|████████▉ | 228/255 [02:38<00:18,  1.44it/s, loss=0.353, v_num=0, train_loss=0.286, train_accuracy=0.833, val_loss=0.357, val_accuracy=0.830]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.10s/it][A
Epoch 85:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.353, v_num=0, train_loss=0.286, train_accuracy=0.833, val_loss=0.357, val_accuracy=0.830]
Validating:  14%|█▍        | 4/29 [00:02<00:12,  2.08it/s][A
Epoch 85:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.353, v_num=0, train_loss=0.286, train_accuracy=0.833, val_loss=0.357, val_accuracy=0.830]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.29it/s][A
Epoch 85:  92%|█████████▏| 234/255 [02:39<00:14,  1.47it/s, loss=0.353, v_num=0, train_loss=0.286,

Epoch 85, global step 19435: val_loss was not in top 2


Epoch 86:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.33, v_num=0, train_loss=0.263, train_accuracy=0.944, val_loss=0.387, val_accuracy=0.813] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 86:  89%|████████▉ | 228/255 [02:37<00:18,  1.44it/s, loss=0.33, v_num=0, train_loss=0.263, train_accuracy=0.944, val_loss=0.387, val_accuracy=0.813]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.18s/it][A
Epoch 86:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.33, v_num=0, train_loss=0.263, train_accuracy=0.944, val_loss=0.387, val_accuracy=0.813]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.98it/s][A
Epoch 86:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.33, v_num=0, train_loss=0.263, train_accuracy=0.944, val_loss=0.387, val_accuracy=0.813]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.19it/s][A
Epoch 86:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.33, v_num=0, train_loss=0.263, tra

Epoch 86, global step 19661: val_loss reached 0.35456 (best 0.35456), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34-v1.ckpt" as top 2


Epoch 87:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.306, v_num=0, train_loss=0.280, train_accuracy=0.944, val_loss=0.355, val_accuracy=0.835]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 87:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.306, v_num=0, train_loss=0.280, train_accuracy=0.944, val_loss=0.355, val_accuracy=0.835]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.09s/it][A
Epoch 87:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.306, v_num=0, train_loss=0.280, train_accuracy=0.944, val_loss=0.355, val_accuracy=0.835]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.10it/s][A
Epoch 87:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.306, v_num=0, train_loss=0.280, train_accuracy=0.944, val_loss=0.355, val_accuracy=0.835]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.33it/s][A
Epoch 87:  92%|█████████▏| 234/255 [02:38<00:14,  1.48it/s, loss=0.306, v_num=0, train_loss=0.280,

Epoch 87, global step 19887: val_loss was not in top 2


Epoch 88:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.37, v_num=0, train_loss=0.304, train_accuracy=0.833, val_loss=0.358, val_accuracy=0.838] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 88:  89%|████████▉ | 228/255 [02:37<00:18,  1.44it/s, loss=0.37, v_num=0, train_loss=0.304, train_accuracy=0.833, val_loss=0.358, val_accuracy=0.838]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.10s/it][A
Epoch 88:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.37, v_num=0, train_loss=0.304, train_accuracy=0.833, val_loss=0.358, val_accuracy=0.838]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.10it/s][A
Epoch 88:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.37, v_num=0, train_loss=0.304, train_accuracy=0.833, val_loss=0.358, val_accuracy=0.838]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.33it/s][A
Epoch 88:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.37, v_num=0, train_loss=0.304, tra

Epoch 88, global step 20113: val_loss was not in top 2


Epoch 89:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.356, v_num=0, train_loss=0.268, train_accuracy=0.944, val_loss=0.514, val_accuracy=0.780]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 89:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.356, v_num=0, train_loss=0.268, train_accuracy=0.944, val_loss=0.514, val_accuracy=0.780]
Validating:   7%|▋         | 2/29 [00:02<00:30,  1.12s/it][A
Epoch 89:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.356, v_num=0, train_loss=0.268, train_accuracy=0.944, val_loss=0.514, val_accuracy=0.780]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  2.05it/s][A
Epoch 89:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.356, v_num=0, train_loss=0.268, train_accuracy=0.944, val_loss=0.514, val_accuracy=0.780]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.29it/s][A
Epoch 89:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.356, v_num=0, train_loss=0.268,

Epoch 89, global step 20339: val_loss was not in top 2


Epoch 90:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.316, v_num=0, train_loss=0.291, train_accuracy=0.833, val_loss=0.369, val_accuracy=0.821]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 90:  89%|████████▉ | 228/255 [02:37<00:18,  1.44it/s, loss=0.316, v_num=0, train_loss=0.291, train_accuracy=0.833, val_loss=0.369, val_accuracy=0.821]
Validating:   7%|▋         | 2/29 [00:02<00:30,  1.11s/it][A
Epoch 90:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.316, v_num=0, train_loss=0.291, train_accuracy=0.833, val_loss=0.369, val_accuracy=0.821]
Validating:  14%|█▍        | 4/29 [00:02<00:12,  2.08it/s][A
Epoch 90:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.316, v_num=0, train_loss=0.291, train_accuracy=0.833, val_loss=0.369, val_accuracy=0.821]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.32it/s][A
Epoch 90:  92%|█████████▏| 234/255 [02:39<00:14,  1.47it/s, loss=0.316, v_num=0, train_loss=0.291,

Epoch 90, global step 20565: val_loss reached 0.34527 (best 0.34527), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34.ckpt" as top 2


Epoch 91:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.322, v_num=0, train_loss=0.257, train_accuracy=0.889, val_loss=0.345, val_accuracy=0.833]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 91:  89%|████████▉ | 228/255 [02:37<00:18,  1.44it/s, loss=0.322, v_num=0, train_loss=0.257, train_accuracy=0.889, val_loss=0.345, val_accuracy=0.833]
Validating:   7%|▋         | 2/29 [00:02<00:30,  1.11s/it][A
Epoch 91:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.322, v_num=0, train_loss=0.257, train_accuracy=0.889, val_loss=0.345, val_accuracy=0.833]
Validating:  14%|█▍        | 4/29 [00:02<00:12,  2.08it/s][A
Epoch 91:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.322, v_num=0, train_loss=0.257, train_accuracy=0.889, val_loss=0.345, val_accuracy=0.833]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.31it/s][A
Epoch 91:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.322, v_num=0, train_loss=0.257,

Epoch 91, global step 20791: val_loss was not in top 2


Epoch 92:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.466, v_num=0, train_loss=0.322, train_accuracy=0.833, val_loss=0.373, val_accuracy=0.816]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 92:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.466, v_num=0, train_loss=0.322, train_accuracy=0.833, val_loss=0.373, val_accuracy=0.816]
Validating:   7%|▋         | 2/29 [00:02<00:30,  1.11s/it][A
Epoch 92:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.466, v_num=0, train_loss=0.322, train_accuracy=0.833, val_loss=0.373, val_accuracy=0.816]
Validating:  14%|█▍        | 4/29 [00:02<00:12,  2.08it/s][A
Epoch 92:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.466, v_num=0, train_loss=0.322, train_accuracy=0.833, val_loss=0.373, val_accuracy=0.816]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.32it/s][A
Epoch 92:  92%|█████████▏| 234/255 [02:38<00:14,  1.48it/s, loss=0.466, v_num=0, train_loss=0.322,

Epoch 92, global step 21017: val_loss was not in top 2


Epoch 93:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.406, v_num=0, train_loss=0.254, train_accuracy=0.833, val_loss=0.483, val_accuracy=0.746]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 93:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.406, v_num=0, train_loss=0.254, train_accuracy=0.833, val_loss=0.483, val_accuracy=0.746]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.10s/it][A
Epoch 93:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.406, v_num=0, train_loss=0.254, train_accuracy=0.833, val_loss=0.483, val_accuracy=0.746]
Validating:  14%|█▍        | 4/29 [00:02<00:12,  2.06it/s][A
Epoch 93:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.406, v_num=0, train_loss=0.254, train_accuracy=0.833, val_loss=0.483, val_accuracy=0.746]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.28it/s][A
Epoch 93:  92%|█████████▏| 234/255 [02:38<00:14,  1.48it/s, loss=0.406, v_num=0, train_loss=0.254,

Epoch 93, global step 21243: val_loss was not in top 2


Epoch 94:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.377, v_num=0, train_loss=0.408, train_accuracy=0.778, val_loss=0.433, val_accuracy=0.783]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 94:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.377, v_num=0, train_loss=0.408, train_accuracy=0.778, val_loss=0.433, val_accuracy=0.783]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.09s/it][A
Epoch 94:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.377, v_num=0, train_loss=0.408, train_accuracy=0.778, val_loss=0.433, val_accuracy=0.783]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.11it/s][A
Epoch 94:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.377, v_num=0, train_loss=0.408, train_accuracy=0.778, val_loss=0.433, val_accuracy=0.783]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.31it/s][A
Epoch 94:  92%|█████████▏| 234/255 [02:38<00:14,  1.48it/s, loss=0.377, v_num=0, train_loss=0.408,

Epoch 94, global step 21469: val_loss was not in top 2


Epoch 95:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.344, v_num=0, train_loss=0.294, train_accuracy=0.833, val_loss=0.406, val_accuracy=0.794]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 95:  89%|████████▉ | 228/255 [02:37<00:18,  1.44it/s, loss=0.344, v_num=0, train_loss=0.294, train_accuracy=0.833, val_loss=0.406, val_accuracy=0.794]
Validating:   7%|▋         | 2/29 [00:02<00:30,  1.11s/it][A
Epoch 95:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.344, v_num=0, train_loss=0.294, train_accuracy=0.833, val_loss=0.406, val_accuracy=0.794]
Validating:  14%|█▍        | 4/29 [00:02<00:12,  2.05it/s][A
Epoch 95:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.344, v_num=0, train_loss=0.294, train_accuracy=0.833, val_loss=0.406, val_accuracy=0.794]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.26it/s][A
Epoch 95:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.344, v_num=0, train_loss=0.294,

Epoch 95, global step 21695: val_loss was not in top 2


Epoch 96:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.367, v_num=0, train_loss=0.353, train_accuracy=0.778, val_loss=0.395, val_accuracy=0.808]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 96:  89%|████████▉ | 228/255 [02:37<00:18,  1.44it/s, loss=0.367, v_num=0, train_loss=0.353, train_accuracy=0.778, val_loss=0.395, val_accuracy=0.808]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.11s/it][A
Epoch 96:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.367, v_num=0, train_loss=0.353, train_accuracy=0.778, val_loss=0.395, val_accuracy=0.808]
Validating:  14%|█▍        | 4/29 [00:02<00:12,  2.06it/s][A
Epoch 96:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.367, v_num=0, train_loss=0.353, train_accuracy=0.778, val_loss=0.395, val_accuracy=0.808]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.29it/s][A
Epoch 96:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.367, v_num=0, train_loss=0.353,

Epoch 96, global step 21921: val_loss was not in top 2


Epoch 97:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.345, v_num=0, train_loss=0.320, train_accuracy=0.778, val_loss=0.385, val_accuracy=0.811]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 97:  89%|████████▉ | 228/255 [02:37<00:18,  1.44it/s, loss=0.345, v_num=0, train_loss=0.320, train_accuracy=0.778, val_loss=0.385, val_accuracy=0.811]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.09s/it][A
Epoch 97:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.345, v_num=0, train_loss=0.320, train_accuracy=0.778, val_loss=0.385, val_accuracy=0.811]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.10it/s][A
Epoch 97:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.345, v_num=0, train_loss=0.320, train_accuracy=0.778, val_loss=0.385, val_accuracy=0.811]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.27it/s][A
Epoch 97:  92%|█████████▏| 234/255 [02:39<00:14,  1.47it/s, loss=0.345, v_num=0, train_loss=0.320,

Epoch 97, global step 22147: val_loss was not in top 2


Epoch 98:  19%|█▉        | 48/255 [00:34<02:29,  1.38it/s, loss=0.348, v_num=0, train_loss=0.442, train_accuracy=0.800, val_loss=0.379, val_accuracy=0.821] 

IOPub message rate exceeded.
The notebook server will temporarily stop sending output
to the client in order to avoid crashing it.
To change this limit, set the config variable
`--NotebookApp.iopub_msg_rate_limit`.

Current values:
NotebookApp.iopub_msg_rate_limit=1000.0 (msgs/sec)
NotebookApp.rate_limit_window=3.0 (secs)



Epoch 101:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.293, v_num=0, train_loss=0.243, train_accuracy=0.889, val_loss=0.354, val_accuracy=0.828]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 101:  89%|████████▉ | 228/255 [02:37<00:18,  1.44it/s, loss=0.293, v_num=0, train_loss=0.243, train_accuracy=0.889, val_loss=0.354, val_accuracy=0.828]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.16s/it][A
Epoch 101:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.293, v_num=0, train_loss=0.243, train_accuracy=0.889, val_loss=0.354, val_accuracy=0.828]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  2.01it/s][A
Epoch 101:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.293, v_num=0, train_loss=0.243, train_accuracy=0.889, val_loss=0.354, val_accuracy=0.828]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.24it/s][A
Epoch 101:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.293, v_num=0, train_loss=0

Epoch 101, global step 23051: val_loss reached 0.35065 (best 0.34527), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34-v1.ckpt" as top 2


Epoch 102:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.308, v_num=0, train_loss=0.201, train_accuracy=0.944, val_loss=0.351, val_accuracy=0.834]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 102:  89%|████████▉ | 228/255 [02:37<00:18,  1.44it/s, loss=0.308, v_num=0, train_loss=0.201, train_accuracy=0.944, val_loss=0.351, val_accuracy=0.834]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.07s/it][A
Epoch 102:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.308, v_num=0, train_loss=0.201, train_accuracy=0.944, val_loss=0.351, val_accuracy=0.834]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.12it/s][A
Epoch 102:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.308, v_num=0, train_loss=0.201, train_accuracy=0.944, val_loss=0.351, val_accuracy=0.834]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.29it/s][A
Epoch 102:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.308, v_num=0, train_loss=0

Epoch 102, global step 23277: val_loss was not in top 2


Epoch 103:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.313, v_num=0, train_loss=0.461, train_accuracy=0.778, val_loss=0.354, val_accuracy=0.838]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 103:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.313, v_num=0, train_loss=0.461, train_accuracy=0.778, val_loss=0.354, val_accuracy=0.838]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.08s/it][A
Epoch 103:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.313, v_num=0, train_loss=0.461, train_accuracy=0.778, val_loss=0.354, val_accuracy=0.838]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.11it/s][A
Epoch 103:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.313, v_num=0, train_loss=0.461, train_accuracy=0.778, val_loss=0.354, val_accuracy=0.838]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.32it/s][A
Epoch 103:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.313, v_num=0, train_loss=0

Epoch 103, global step 23503: val_loss was not in top 2


Epoch 104:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.313, v_num=0, train_loss=0.313, train_accuracy=0.833, val_loss=0.366, val_accuracy=0.843]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 104:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.313, v_num=0, train_loss=0.313, train_accuracy=0.833, val_loss=0.366, val_accuracy=0.843]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.08s/it][A
Epoch 104:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.313, v_num=0, train_loss=0.313, train_accuracy=0.833, val_loss=0.366, val_accuracy=0.843]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.12it/s][A
Epoch 104:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.313, v_num=0, train_loss=0.313, train_accuracy=0.833, val_loss=0.366, val_accuracy=0.843]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.35it/s][A
Epoch 104:  92%|█████████▏| 234/255 [02:38<00:14,  1.48it/s, loss=0.313, v_num=0, train_loss=0

Epoch 104, global step 23729: val_loss reached 0.34607 (best 0.34527), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34-v1.ckpt" as top 2


Epoch 105:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.31, v_num=0, train_loss=0.269, train_accuracy=0.889, val_loss=0.346, val_accuracy=0.839] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 105:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.31, v_num=0, train_loss=0.269, train_accuracy=0.889, val_loss=0.346, val_accuracy=0.839]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.09s/it][A
Epoch 105:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.31, v_num=0, train_loss=0.269, train_accuracy=0.889, val_loss=0.346, val_accuracy=0.839]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.11it/s][A
Epoch 105:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.31, v_num=0, train_loss=0.269, train_accuracy=0.889, val_loss=0.346, val_accuracy=0.839]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.33it/s][A
Epoch 105:  92%|█████████▏| 234/255 [02:38<00:14,  1.48it/s, loss=0.31, v_num=0, train_loss=0.269

Epoch 105, global step 23955: val_loss reached 0.34592 (best 0.34527), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34-v1.ckpt" as top 2


Epoch 106:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.28, v_num=0, train_loss=0.205, train_accuracy=0.889, val_loss=0.346, val_accuracy=0.826] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 106:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.28, v_num=0, train_loss=0.205, train_accuracy=0.889, val_loss=0.346, val_accuracy=0.826]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.09s/it][A
Epoch 106:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.28, v_num=0, train_loss=0.205, train_accuracy=0.889, val_loss=0.346, val_accuracy=0.826]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.12it/s][A
Epoch 106:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.28, v_num=0, train_loss=0.205, train_accuracy=0.889, val_loss=0.346, val_accuracy=0.826]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.31it/s][A
Epoch 106:  92%|█████████▏| 234/255 [02:38<00:14,  1.48it/s, loss=0.28, v_num=0, train_loss=0.205

Epoch 106, global step 24181: val_loss reached 0.34382 (best 0.34382), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34-v1.ckpt" as top 2


Epoch 107:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.292, v_num=0, train_loss=0.254, train_accuracy=0.889, val_loss=0.344, val_accuracy=0.840]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 107:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.292, v_num=0, train_loss=0.254, train_accuracy=0.889, val_loss=0.344, val_accuracy=0.840]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.09s/it][A
Epoch 107:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.292, v_num=0, train_loss=0.254, train_accuracy=0.889, val_loss=0.344, val_accuracy=0.840]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.10it/s][A
Epoch 107:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.292, v_num=0, train_loss=0.254, train_accuracy=0.889, val_loss=0.344, val_accuracy=0.840]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.30it/s][A
Epoch 107:  92%|█████████▏| 234/255 [02:38<00:14,  1.48it/s, loss=0.292, v_num=0, train_loss=0

Epoch 107, global step 24407: val_loss was not in top 2


Epoch 108:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.291, v_num=0, train_loss=0.176, train_accuracy=0.944, val_loss=0.346, val_accuracy=0.832]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 108:  89%|████████▉ | 228/255 [02:37<00:18,  1.44it/s, loss=0.291, v_num=0, train_loss=0.176, train_accuracy=0.944, val_loss=0.346, val_accuracy=0.832]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.09s/it][A
Epoch 108:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.291, v_num=0, train_loss=0.176, train_accuracy=0.944, val_loss=0.346, val_accuracy=0.832]
Validating:  14%|█▍        | 4/29 [00:02<00:12,  2.07it/s][A
Epoch 108:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.291, v_num=0, train_loss=0.176, train_accuracy=0.944, val_loss=0.346, val_accuracy=0.832]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.29it/s][A
Epoch 108:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.291, v_num=0, train_loss=0

Epoch 108, global step 24633: val_loss reached 0.33172 (best 0.33172), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34.ckpt" as top 2


Epoch 109:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.267, v_num=0, train_loss=0.467, train_accuracy=0.833, val_loss=0.332, val_accuracy=0.840]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 109:  89%|████████▉ | 228/255 [02:37<00:18,  1.44it/s, loss=0.267, v_num=0, train_loss=0.467, train_accuracy=0.833, val_loss=0.332, val_accuracy=0.840]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.10s/it][A
Epoch 109:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.267, v_num=0, train_loss=0.467, train_accuracy=0.833, val_loss=0.332, val_accuracy=0.840]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.09it/s][A
Epoch 109:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.267, v_num=0, train_loss=0.467, train_accuracy=0.833, val_loss=0.332, val_accuracy=0.840]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.27it/s][A
Epoch 109:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.267, v_num=0, train_loss=0

Epoch 109, global step 24859: val_loss reached 0.32935 (best 0.32935), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34-v1.ckpt" as top 2


Epoch 110:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.275, v_num=0, train_loss=0.326, train_accuracy=0.833, val_loss=0.329, val_accuracy=0.847] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 110:  89%|████████▉ | 228/255 [02:37<00:18,  1.44it/s, loss=0.275, v_num=0, train_loss=0.326, train_accuracy=0.833, val_loss=0.329, val_accuracy=0.847]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.11s/it][A
Epoch 110:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.275, v_num=0, train_loss=0.326, train_accuracy=0.833, val_loss=0.329, val_accuracy=0.847]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.09it/s][A
Epoch 110:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.275, v_num=0, train_loss=0.326, train_accuracy=0.833, val_loss=0.329, val_accuracy=0.847]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.27it/s][A
Epoch 110:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.275, v_num=0, train_loss=

Epoch 110, global step 25085: val_loss reached 0.32719 (best 0.32719), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34.ckpt" as top 2


Epoch 111:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.266, v_num=0, train_loss=0.358, train_accuracy=0.889, val_loss=0.327, val_accuracy=0.854]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 111:  89%|████████▉ | 228/255 [02:37<00:18,  1.44it/s, loss=0.266, v_num=0, train_loss=0.358, train_accuracy=0.889, val_loss=0.327, val_accuracy=0.854]
Validating:   7%|▋         | 2/29 [00:02<00:31,  1.17s/it][A
Epoch 111:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.266, v_num=0, train_loss=0.358, train_accuracy=0.889, val_loss=0.327, val_accuracy=0.854]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.97it/s][A
Epoch 111:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.266, v_num=0, train_loss=0.358, train_accuracy=0.889, val_loss=0.327, val_accuracy=0.854]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.15it/s][A
Epoch 111:  92%|█████████▏| 234/255 [02:39<00:14,  1.47it/s, loss=0.266, v_num=0, train_loss=0

Epoch 111, global step 25311: val_loss was not in top 2


Epoch 112:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.305, v_num=0, train_loss=0.280, train_accuracy=0.944, val_loss=0.343, val_accuracy=0.846]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 112:  89%|████████▉ | 228/255 [02:37<00:18,  1.44it/s, loss=0.305, v_num=0, train_loss=0.280, train_accuracy=0.944, val_loss=0.343, val_accuracy=0.846]
Validating:   7%|▋         | 2/29 [00:02<00:32,  1.19s/it][A
Epoch 112:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.305, v_num=0, train_loss=0.280, train_accuracy=0.944, val_loss=0.343, val_accuracy=0.846]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  1.97it/s][A
Epoch 112:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.305, v_num=0, train_loss=0.280, train_accuracy=0.944, val_loss=0.343, val_accuracy=0.846]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.18it/s][A
Epoch 112:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.305, v_num=0, train_loss=0

Epoch 112, global step 25537: val_loss reached 0.31025 (best 0.31025), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34-v1.ckpt" as top 2


Epoch 113:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.27, v_num=0, train_loss=0.226, train_accuracy=0.889, val_loss=0.310, val_accuracy=0.851] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 113:  89%|████████▉ | 228/255 [02:37<00:18,  1.44it/s, loss=0.27, v_num=0, train_loss=0.226, train_accuracy=0.889, val_loss=0.310, val_accuracy=0.851]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.11s/it][A
Epoch 113:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.27, v_num=0, train_loss=0.226, train_accuracy=0.889, val_loss=0.310, val_accuracy=0.851]
Validating:  14%|█▍        | 4/29 [00:02<00:12,  2.06it/s][A
Epoch 113:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.27, v_num=0, train_loss=0.226, train_accuracy=0.889, val_loss=0.310, val_accuracy=0.851]
Validating:  21%|██        | 6/29 [00:03<00:06,  3.30it/s][A
Epoch 113:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.27, v_num=0, train_loss=0.226

Epoch 113, global step 25763: val_loss reached 0.31331 (best 0.31025), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34.ckpt" as top 2


Epoch 114:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.246, v_num=0, train_loss=0.384, train_accuracy=0.833, val_loss=0.313, val_accuracy=0.861]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 114:  89%|████████▉ | 228/255 [02:38<00:18,  1.44it/s, loss=0.246, v_num=0, train_loss=0.384, train_accuracy=0.833, val_loss=0.313, val_accuracy=0.861]
Validating:   7%|▋         | 2/29 [00:02<00:30,  1.13s/it][A
Epoch 114:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.246, v_num=0, train_loss=0.384, train_accuracy=0.833, val_loss=0.313, val_accuracy=0.861]
Validating:  14%|█▍        | 4/29 [00:03<00:12,  2.03it/s][A
Epoch 114:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.246, v_num=0, train_loss=0.384, train_accuracy=0.833, val_loss=0.313, val_accuracy=0.861]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.26it/s][A
Epoch 114:  92%|█████████▏| 234/255 [02:39<00:14,  1.47it/s, loss=0.246, v_num=0, train_loss=0

Epoch 114, global step 25989: val_loss reached 0.30649 (best 0.30649), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-34.ckpt" as top 2


Epoch 115:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.221, v_num=0, train_loss=0.430, train_accuracy=0.722, val_loss=0.306, val_accuracy=0.858]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 115:  89%|████████▉ | 228/255 [02:38<00:18,  1.44it/s, loss=0.221, v_num=0, train_loss=0.430, train_accuracy=0.722, val_loss=0.306, val_accuracy=0.858]
Validating:   7%|▋         | 2/29 [00:02<00:29,  1.10s/it][A
Epoch 115:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.221, v_num=0, train_loss=0.430, train_accuracy=0.722, val_loss=0.306, val_accuracy=0.858]
Validating:  14%|█▍        | 4/29 [00:02<00:11,  2.10it/s][A
Epoch 115:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.221, v_num=0, train_loss=0.430, train_accuracy=0.722, val_loss=0.306, val_accuracy=0.858]
Validating:  21%|██        | 6/29 [00:03<00:07,  3.28it/s][A
Epoch 115:  92%|█████████▏| 234/255 [02:39<00:14,  1.47it/s, loss=0.221, v_num=0, train_loss=0

Epoch 115, global step 26215: val_loss was not in top 2


Epoch 116:  22%|██▏       | 57/255 [00:40<02:22,  1.39it/s, loss=0.25, v_num=0, train_loss=0.217, train_accuracy=0.900, val_loss=0.324, val_accuracy=0.855]  

## Load Checkpoint 

In [None]:
# Checkpoint to resume training from: best-checkpoint-corr-3-v1.ckpt
# trainer.fit(model, data_module, ckpt_path="/Workspace/code/checkpoints/best-checkpoint-corr-3-v1.ckpt")