In [1]:
import os
import pandas as pd
import numpy as np
from sklearn.preprocessing import LabelEncoder
from sklearn.model_selection import train_test_split
from sklearn.metrics import classification_report, confusion_matrix
import matplotlib.pyplot as plt

import torch
from torch import nn, optim
from torch.nn import functional as F
from torch.utils.data import Dataset, DataLoader

import torchmetrics
from torchmetrics.functional import accuracy, f1_score

import pytorch_lightning as pl
from pytorch_lightning.loggers import TensorBoardLogger
from pytorch_lightning.callbacks import ModelCheckpoint

device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
print(device)

  from .autonotebook import tqdm as notebook_tqdm


cuda


## Model Setup 

In [2]:
pl.seed_everything(42, workers=True)

class DrowsyDataset(Dataset):
    
    def __init__(self, sequences):
        self.sequences = sequences
        
    def __len__(self):
        return len(self.sequences)
    
    def __getitem__(self, idx):
        sequence, label = self.sequences[idx]
        return dict(
            sequence=torch.Tensor(sequence.to_numpy()),
            label=torch.tensor(label).long()
        )
    
class DrowsyDataModule(pl.LightningDataModule):
    
    def __init__(self, train_sequences, val_sequences, test_sequences, batch_size):
        super().__init__()
        self.train_sequences = train_sequences
        self.val_sequences = val_sequences
        self.test_sequences = test_sequences
        self.batch_size = batch_size

    def setup(self, stage=None):
        self.train_dataset = DrowsyDataset(self.train_sequences)
        self.val_dataset = DrowsyDataset(self.val_sequences)
        self.test_dataset = DrowsyDataset(self.test_sequences)
        
    def train_dataloader(self):
        return DataLoader(
            self.train_dataset,
            batch_size=self.batch_size,
            shuffle=True,
            num_workers=os.cpu_count()
        )
    
    def val_dataloader(self):
        return DataLoader(
            self.val_dataset,
            batch_size=self.batch_size,
            shuffle=False,
            num_workers=os.cpu_count()
        )
    
    def test_dataloader(self):
        return DataLoader(
            self.test_dataset,
            batch_size=self.batch_size,
            shuffle=False,
            num_workers=os.cpu_count()
        ) 

class DrowsyModel(nn.Module):
    
    def __init__(self, n_features, n_classes, n_hidden=256, n_layers=3):
        super().__init__()
        
        self.n_hidden = n_hidden
        
        self.lstm = nn.LSTM(
            input_size=n_features,
            hidden_size=n_hidden,
            num_layers=n_layers,
            batch_first=True,
            dropout=0.75
        )
        
        self.classifier = nn.Linear(n_hidden, n_classes)
        
    def forward(self, x):
        self.lstm.flatten_parameters()
        _, (hidden, _) = self.lstm(x)
        
        out = hidden[-1]
        return self.classifier(out)
    
class DrowsyPredictor(pl.LightningModule):
    
    def __init__(self, n_features: int, n_classes: int):
        super().__init__()
        self.model = DrowsyModel(n_features, n_classes)
        self.criterion = nn.CrossEntropyLoss()
        
    def forward(self, x, label=None):
        output = self.model(x)
        loss = 0
        if label is not None:
            loss = self.criterion(output, label)
        return loss, output
        
    def training_step(self, batch, batch_idx):
        sequences = batch["sequence"]
        labels = batch["label"]
        loss, outputs = self(sequences, labels)
        predictions = torch.argmax(outputs, dim=1)
        step_accuracy = accuracy(predictions, labels)
        my_f1_score = f1_score(predictions, labels)
        
        self.log("train_loss", loss, prog_bar=True, logger=True)
        self.log("train_accuracy", step_accuracy, prog_bar=True, logger=True)
        self.log("train_f1_score", my_f1_score, prog_bar=True, logger=True)
        
        return {"loss": loss, "accuracy": step_accuracy, "f1_score": my_f1_score}
    
    def validation_step(self, batch, batch_idx):
        sequences = batch["sequence"]
        labels = batch["label"]
        loss, outputs = self(sequences, labels)
        predictions = torch.argmax(outputs, dim=1)
        step_accuracy = accuracy(predictions, labels)
        my_f1_score = f1_score(predictions, labels)
        
        self.log("val_loss", loss, prog_bar=True, logger=True)
        self.log("val_accuracy", step_accuracy, prog_bar=True, logger=True)
        self.log("val_f1_score", my_f1_score, prog_bar=True, logger=True)
        
        return {"loss": loss, "accuracy": step_accuracy, "f1_score": my_f1_score}
    
    def test_step(self, batch, batch_idx):
        sequences = batch["sequence"]
        labels = batch["label"]
        loss, outputs = self(sequences, labels)
        predictions = torch.argmax(outputs, dim=1)
        step_accuracy = accuracy(predictions, labels)
        my_f1_score = f1_score(predictions, labels)
        
        self.log("test_train_loss", loss, prog_bar=True, logger=True)
        self.log("test_train_accuracy", step_accuracy, prog_bar=True, logger=True)
        self.log("test_f1_score", my_f1_score, prog_bar=True, logger=True)
        
        return {"loss": loss, "accuracy": step_accuracy, "f1_score": my_f1_score}
    
    def configure_optimizers(self):
        return optim.Adam(self.parameters(), lr=0.0001)

Global seed set to 42


## 參數設置

In [3]:
%load_ext tensorboard
%reload_ext tensorboard
%tensorboard --logdir ./lightning_logs --host 0.0.0.0 --port=8888

ERROR: Failed to launch TensorBoard (exited with 255).
Contents of stderr:
2022-06-28 06:04:43.628716: I tensorflow/stream_executor/platform/default/dso_loader.cc:48] Successfully opened dynamic library libcudart.so.10.1
E0628 06:04:51.250766 140239692838720 program.py:312] TensorBoard could not bind to port 8888, it was already in use
ERROR: TensorBoard could not bind to port 8888, it was already in use

In [4]:
X_train = pd.read_csv('../data2.csv')

In [5]:
N_EPOCHS = 200
BATCH_SIZE = 50

ORG_FEATURE_COLUMNS = ['TP8', 'FP2', 'FCZ', 'FT10', 'O2', 'O1', 'FT7', 'F4', 'TP7', 'C3', 'C4', 'F3', 'FT8', 'T6', 'HEOR', 'T5', 'VEOL', 'F7', 'FZ', 'VEOU', 'A1', 'P3', 'PZ', 'CP3', 'P4', 'CPZ', 'A2', 'HEOL', 'CP4', 'FT9', 'F8', 'OZ', 'CZ', 'FC4', 'FC3', 'FP1', 'PO1', 'T3', 'T4', 'PO2']
g = X_train.groupby("group")

# ORG_FEATURE_COLUMNS = ['FP1','FP2','FZ']


## Main

In [None]:
n = 0
FEATURE_COLUMNS = ORG_FEATURE_COLUMNS[n:]

while(n < 40):
    print("------------------ Round: " + str(n) + " ------------------")
    print(FEATURE_COLUMNS)
    print("Len:", len(FEATURE_COLUMNS))
    
    label_encoder = LabelEncoder()
    encoded_labels = label_encoder.fit_transform(X_train.state)

    label_encoder.classes_

    X_train['label'] = encoded_labels

    # Prepare data ###########################################
    sequences = [] 

    for name, group in g:
        sequence_features = group[FEATURE_COLUMNS]
        label = group.label.iloc[0]

        # print((sequence_features, label))
        sequences.append((sequence_features, label))

    # Setting up train, test, val gruop #######################
    train_sequences, test_sequences = train_test_split(sequences, test_size=0.2)
    val_sequences, test_sequences = train_test_split(test_sequences, test_size=0.5)


    # Setting up data module ##################################
    data_module = DrowsyDataModule(
        train_sequences, val_sequences, test_sequences, BATCH_SIZE
    )

    model = DrowsyPredictor(
        n_features=len(FEATURE_COLUMNS), 
        n_classes=len(label_encoder.classes_)
    )

    # Check points and logger #################################
    checkpoint_callback = ModelCheckpoint(
        dirpath="checkpoints",
        filename="best-checkpoint-corr-" + str(n),
        save_top_k=2,
        verbose=True,
        monitor="val_loss",
        mode="min"
    )

    logger = TensorBoardLogger("lightning_logs", name="Drowsy_pcc" + str(n))

    trainer = pl.Trainer(
        logger=logger,
        callbacks=[checkpoint_callback],
        max_epochs=N_EPOCHS,
        gpus=[1],
        # gpus=2, 
        # auto_select_gpus=True,
        auto_lr_find=True, 
        # check_val_every_n_epoch=10
        # refresh_rate=20,
    )
    
    # Training start
    if (n == 3):
        trainer.fit(model, data_module, ckpt_path="Workspace/code/checkpoints/best-checkpoint-corr-3-v1.ckpt")
    else:
        trainer.fit(model, data_module)
    trainer.test(model, data_module)
    
    FEATURE_COLUMNS.pop(0)
    n = n + 1

------------------ Round: 0 ------------------
['TP8', 'FP2', 'FCZ', 'FT10', 'O2', 'O1', 'FT7', 'F4', 'TP7', 'C3', 'C4', 'F3', 'FT8', 'T6', 'HEOR', 'T5', 'VEOL', 'F7', 'FZ', 'VEOU', 'A1', 'P3', 'PZ', 'CP3', 'P4', 'CPZ', 'A2', 'HEOL', 'CP4', 'FT9', 'F8', 'OZ', 'CZ', 'FC4', 'FC3', 'FP1', 'PO1', 'T3', 'T4', 'PO2']
Len: 40


GPU available: True, used: True
TPU available: False, using: 0 TPU cores
IPU available: False, using: 0 IPUs
Restoring states from the checkpoint path at /Workspace/code/checkpoints/best-checkpoint-corr-0-v2.ckpt
LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1,2]
  "You're resuming from a checkpoint that ended mid-epoch."
Restored all states from the checkpoint file at /Workspace/code/checkpoints/best-checkpoint-corr-0-v2.ckpt

  | Name      | Type             | Params
-----------------------------------------------
0 | model     | DrowsyModel      | 1.4 M 
1 | criterion | CrossEntropyLoss | 0     
-----------------------------------------------
1.4 M     Trainable params
0         Non-trainable params
1.4 M     Total params
5.433     Total estimated model params size (MB)
  rank_zero_warn(f"Checkpoint directory {dirpath} exists and is not empty.")


                                                                      

Global seed set to 42


Epoch 149:  89%|████████▊ | 226/255 [02:24<00:18,  1.56it/s, loss=0.0739, v_num=8, train_loss=0.0754, train_accuracy=0.944, train_f1_score=0.944]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 149:  89%|████████▉ | 228/255 [02:27<00:17,  1.54it/s, loss=0.0739, v_num=8, train_loss=0.0754, train_accuracy=0.944, train_f1_score=0.944]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.27s/it][A
Epoch 149:  90%|█████████ | 230/255 [02:28<00:16,  1.55it/s, loss=0.0739, v_num=8, train_loss=0.0754, train_accuracy=0.944, train_f1_score=0.944]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.78it/s][A
Epoch 149:  91%|█████████ | 232/255 [02:28<00:14,  1.56it/s, loss=0.0739, v_num=8, train_loss=0.0754, train_accuracy=0.944, train_f1_score=0.944]
Validating:  21%|██        | 6/29 [00:03<00:07,  2.90it/s][A
Epoch 149:  92%|█████████▏| 234/255 [02:28<00:13,  1.57it/s, loss=0.0739, v_num=8, train_loss=0.0754, train_accuracy=0.944, train_f1_score=0.9

Epoch 149, global step 33899: val_loss was not in top 2


Epoch 150:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.134, v_num=8, train_loss=0.139, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.328, val_accuracy=0.913, val_f1_score=0.913]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 150:  89%|████████▉ | 228/255 [02:29<00:17,  1.53it/s, loss=0.134, v_num=8, train_loss=0.139, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.328, val_accuracy=0.913, val_f1_score=0.913]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.28s/it][A
Epoch 150:  90%|█████████ | 230/255 [02:29<00:16,  1.54it/s, loss=0.134, v_num=8, train_loss=0.139, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.328, val_accuracy=0.913, val_f1_score=0.913]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.77it/s][A
Epoch 150:  91%|█████████ | 232/255 [02:30<00:14,  1.55it/s, loss=0.134, v_num=8, train_loss=0.139, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.328, val_accuracy=0.913, val_f1

Epoch 150, global step 34125: val_loss was not in top 2


Epoch 151:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.143, v_num=8, train_loss=0.419, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.335, val_accuracy=0.903, val_f1_score=0.903]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 151:  89%|████████▉ | 228/255 [02:29<00:17,  1.52it/s, loss=0.143, v_num=8, train_loss=0.419, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.335, val_accuracy=0.903, val_f1_score=0.903]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.29s/it][A
Epoch 151:  90%|█████████ | 230/255 [02:30<00:16,  1.53it/s, loss=0.143, v_num=8, train_loss=0.419, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.335, val_accuracy=0.903, val_f1_score=0.903]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.74it/s][A
Epoch 151:  91%|█████████ | 232/255 [02:30<00:14,  1.54it/s, loss=0.143, v_num=8, train_loss=0.419, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.335, val_accuracy=0.903, val_f1

Epoch 151, global step 34351: val_loss was not in top 2


Epoch 152:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.0803, v_num=8, train_loss=0.0513, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.364, val_accuracy=0.903, val_f1_score=0.903]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 152:  89%|████████▉ | 228/255 [02:30<00:17,  1.52it/s, loss=0.0803, v_num=8, train_loss=0.0513, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.364, val_accuracy=0.903, val_f1_score=0.903]
Validating:   7%|▋         | 2/29 [00:02<00:34,  1.27s/it][A
Epoch 152:  90%|█████████ | 230/255 [02:30<00:16,  1.53it/s, loss=0.0803, v_num=8, train_loss=0.0513, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.364, val_accuracy=0.903, val_f1_score=0.903]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.88it/s][A
Epoch 152:  91%|█████████ | 232/255 [02:30<00:14,  1.54it/s, loss=0.0803, v_num=8, train_loss=0.0513, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.364, val_accuracy=0.903, 

Epoch 152, global step 34577: val_loss was not in top 2


Epoch 153:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.106, v_num=8, train_loss=0.0258, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.300, val_accuracy=0.916, val_f1_score=0.916] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 153:  89%|████████▉ | 228/255 [02:29<00:17,  1.52it/s, loss=0.106, v_num=8, train_loss=0.0258, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.300, val_accuracy=0.916, val_f1_score=0.916]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.30s/it][A
Epoch 153:  90%|█████████ | 230/255 [02:30<00:16,  1.53it/s, loss=0.106, v_num=8, train_loss=0.0258, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.300, val_accuracy=0.916, val_f1_score=0.916]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.85it/s][A
Epoch 153:  91%|█████████ | 232/255 [02:30<00:14,  1.54it/s, loss=0.106, v_num=8, train_loss=0.0258, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.300, val_accuracy=0.916, val

Epoch 153, global step 34803: val_loss was not in top 2


Epoch 154:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.119, v_num=8, train_loss=0.0216, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.906, val_f1_score=0.906] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 154:  89%|████████▉ | 228/255 [02:29<00:17,  1.52it/s, loss=0.119, v_num=8, train_loss=0.0216, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.906, val_f1_score=0.906]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.27s/it][A
Epoch 154:  90%|█████████ | 230/255 [02:30<00:16,  1.53it/s, loss=0.119, v_num=8, train_loss=0.0216, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.906, val_f1_score=0.906]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.77it/s][A
Epoch 154:  91%|█████████ | 232/255 [02:30<00:14,  1.54it/s, loss=0.119, v_num=8, train_loss=0.0216, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.906, val

Epoch 154, global step 35029: val_loss was not in top 2


Epoch 155:  89%|████████▊ | 226/255 [02:27<00:18,  1.54it/s, loss=0.104, v_num=8, train_loss=0.0205, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.270, val_accuracy=0.915, val_f1_score=0.915] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 155:  89%|████████▉ | 228/255 [02:30<00:17,  1.52it/s, loss=0.104, v_num=8, train_loss=0.0205, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.270, val_accuracy=0.915, val_f1_score=0.915]
Validating:   7%|▋         | 2/29 [00:03<00:34,  1.27s/it][A
Epoch 155:  90%|█████████ | 230/255 [02:30<00:16,  1.53it/s, loss=0.104, v_num=8, train_loss=0.0205, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.270, val_accuracy=0.915, val_f1_score=0.915]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.78it/s][A
Epoch 155:  91%|█████████ | 232/255 [02:30<00:14,  1.54it/s, loss=0.104, v_num=8, train_loss=0.0205, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.270, val_accuracy=0.915, val

Epoch 155, global step 35255: val_loss was not in top 2


Epoch 156:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.104, v_num=8, train_loss=0.0712, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.266, val_accuracy=0.911, val_f1_score=0.911] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 156:  89%|████████▉ | 228/255 [02:30<00:17,  1.51it/s, loss=0.104, v_num=8, train_loss=0.0712, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.266, val_accuracy=0.911, val_f1_score=0.911]
Epoch 156:  90%|█████████ | 230/255 [02:30<00:16,  1.52it/s, loss=0.104, v_num=8, train_loss=0.0712, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.266, val_accuracy=0.911, val_f1_score=0.911]
Validating:  14%|█▍        | 4/29 [00:03<00:16,  1.53it/s][A
Epoch 156:  91%|█████████ | 232/255 [02:31<00:14,  1.53it/s, loss=0.104, v_num=8, train_loss=0.0712, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.266, val_accuracy=0.911, val_f1_score=0.911]
Validating:  21%|██        | 6/29 [00:03<00:0

Epoch 156, global step 35481: val_loss was not in top 2


Epoch 157:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.108, v_num=8, train_loss=0.162, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.263, val_accuracy=0.906, val_f1_score=0.906]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 157:  89%|████████▉ | 228/255 [02:29<00:17,  1.52it/s, loss=0.108, v_num=8, train_loss=0.162, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.263, val_accuracy=0.906, val_f1_score=0.906]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.36s/it][A
Epoch 157:  90%|█████████ | 230/255 [02:30<00:16,  1.53it/s, loss=0.108, v_num=8, train_loss=0.162, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.263, val_accuracy=0.906, val_f1_score=0.906]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.80it/s][A
Epoch 157:  91%|█████████ | 232/255 [02:30<00:14,  1.54it/s, loss=0.108, v_num=8, train_loss=0.162, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.263, val_accuracy=0.906, val_f1

Epoch 157, global step 35707: val_loss was not in top 2


Epoch 158:  89%|████████▊ | 226/255 [02:27<00:18,  1.54it/s, loss=0.117, v_num=8, train_loss=0.264, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.270, val_accuracy=0.897, val_f1_score=0.897]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 158:  89%|████████▉ | 228/255 [02:30<00:17,  1.52it/s, loss=0.117, v_num=8, train_loss=0.264, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.270, val_accuracy=0.897, val_f1_score=0.897]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.35s/it][A
Epoch 158:  90%|█████████ | 230/255 [02:30<00:16,  1.53it/s, loss=0.117, v_num=8, train_loss=0.264, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.270, val_accuracy=0.897, val_f1_score=0.897]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.81it/s][A
Epoch 158:  91%|█████████ | 232/255 [02:30<00:14,  1.54it/s, loss=0.117, v_num=8, train_loss=0.264, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.270, val_accuracy=0.897, val_f1

Epoch 158, global step 35933: val_loss was not in top 2


Epoch 159:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.107, v_num=8, train_loss=0.161, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.256, val_accuracy=0.914, val_f1_score=0.914]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 159:  89%|████████▉ | 228/255 [02:29<00:17,  1.52it/s, loss=0.107, v_num=8, train_loss=0.161, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.256, val_accuracy=0.914, val_f1_score=0.914]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.34s/it][A
Epoch 159:  90%|█████████ | 230/255 [02:30<00:16,  1.53it/s, loss=0.107, v_num=8, train_loss=0.161, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.256, val_accuracy=0.914, val_f1_score=0.914]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.81it/s][A
Epoch 159:  91%|█████████ | 232/255 [02:30<00:14,  1.54it/s, loss=0.107, v_num=8, train_loss=0.161, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.256, val_accuracy=0.914, val_f1

Epoch 159, global step 36159: val_loss reached 0.23913 (best 0.23913), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-0-v3.ckpt" as top 2


Epoch 160:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.196, v_num=8, train_loss=0.122, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.239, val_accuracy=0.906, val_f1_score=0.906]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 160:  89%|████████▉ | 228/255 [02:30<00:17,  1.52it/s, loss=0.196, v_num=8, train_loss=0.122, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.239, val_accuracy=0.906, val_f1_score=0.906]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.35s/it][A
Epoch 160:  90%|█████████ | 230/255 [02:30<00:16,  1.53it/s, loss=0.196, v_num=8, train_loss=0.122, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.239, val_accuracy=0.906, val_f1_score=0.906]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.84it/s][A
Epoch 160:  91%|█████████ | 232/255 [02:31<00:14,  1.54it/s, loss=0.196, v_num=8, train_loss=0.122, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.239, val_accuracy=0.906, val_f1

Epoch 160, global step 36385: val_loss was not in top 2


Epoch 161:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.116, v_num=8, train_loss=0.0384, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.405, val_accuracy=0.881, val_f1_score=0.881]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 161:  89%|████████▉ | 228/255 [02:30<00:17,  1.51it/s, loss=0.116, v_num=8, train_loss=0.0384, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.405, val_accuracy=0.881, val_f1_score=0.881]
Validating:   7%|▋         | 2/29 [00:03<00:36,  1.35s/it][A
Epoch 161:  90%|█████████ | 230/255 [02:31<00:16,  1.52it/s, loss=0.116, v_num=8, train_loss=0.0384, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.405, val_accuracy=0.881, val_f1_score=0.881]
Validating:  14%|█▍        | 4/29 [00:03<00:13,  1.83it/s][A
Epoch 161:  91%|█████████ | 232/255 [02:31<00:15,  1.53it/s, loss=0.116, v_num=8, train_loss=0.0384, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.405, val_accuracy=0.881, val_

Epoch 161, global step 36611: val_loss was not in top 2


Epoch 162:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.397, v_num=8, train_loss=0.560, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.314, val_accuracy=0.896, val_f1_score=0.896]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 162:  89%|████████▉ | 228/255 [02:30<00:17,  1.51it/s, loss=0.397, v_num=8, train_loss=0.560, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.314, val_accuracy=0.896, val_f1_score=0.896]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.33s/it][A
Epoch 162:  90%|█████████ | 230/255 [02:30<00:16,  1.52it/s, loss=0.397, v_num=8, train_loss=0.560, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.314, val_accuracy=0.896, val_f1_score=0.896]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.70it/s][A
Epoch 162:  91%|█████████ | 232/255 [02:31<00:14,  1.53it/s, loss=0.397, v_num=8, train_loss=0.560, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.314, val_accuracy=0.896, val_f1

Epoch 162, global step 36837: val_loss was not in top 2


Epoch 163:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.151, v_num=8, train_loss=0.521, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.378, val_accuracy=0.891, val_f1_score=0.891] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 163:  89%|████████▉ | 228/255 [02:30<00:17,  1.51it/s, loss=0.151, v_num=8, train_loss=0.521, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.378, val_accuracy=0.891, val_f1_score=0.891]
Validating:   7%|▋         | 2/29 [00:03<00:35,  1.33s/it][A
Epoch 163:  90%|█████████ | 230/255 [02:30<00:16,  1.52it/s, loss=0.151, v_num=8, train_loss=0.521, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.378, val_accuracy=0.891, val_f1_score=0.891]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.68it/s][A
Epoch 163:  91%|█████████ | 232/255 [02:31<00:15,  1.53it/s, loss=0.151, v_num=8, train_loss=0.521, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.378, val_accuracy=0.891, val_f1_

Epoch 163, global step 37063: val_loss was not in top 2


Epoch 164:  89%|████████▊ | 226/255 [02:27<00:18,  1.54it/s, loss=0.154, v_num=8, train_loss=0.320, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.310, val_accuracy=0.894, val_f1_score=0.894] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 164:  89%|████████▉ | 228/255 [02:30<00:17,  1.52it/s, loss=0.154, v_num=8, train_loss=0.320, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.310, val_accuracy=0.894, val_f1_score=0.894]
Epoch 164:  90%|█████████ | 230/255 [02:30<00:16,  1.53it/s, loss=0.154, v_num=8, train_loss=0.320, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.310, val_accuracy=0.894, val_f1_score=0.894]
Validating:  14%|█▍        | 4/29 [00:03<00:15,  1.58it/s][A
Epoch 164:  91%|█████████ | 232/255 [02:30<00:14,  1.54it/s, loss=0.154, v_num=8, train_loss=0.320, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.310, val_accuracy=0.894, val_f1_score=0.894]
Validating:  21%|██        | 6/29 [00:04<00:08,  

Epoch 164, global step 37289: val_loss was not in top 2


Epoch 165:  89%|████████▊ | 226/255 [02:27<00:18,  1.54it/s, loss=0.114, v_num=8, train_loss=0.0208, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.334, val_accuracy=0.895, val_f1_score=0.895]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 165:  89%|████████▉ | 228/255 [02:30<00:17,  1.52it/s, loss=0.114, v_num=8, train_loss=0.0208, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.334, val_accuracy=0.895, val_f1_score=0.895]
Validating:   7%|▋         | 2/29 [00:03<00:38,  1.44s/it][A
Epoch 165:  90%|█████████ | 230/255 [02:30<00:16,  1.52it/s, loss=0.114, v_num=8, train_loss=0.0208, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.334, val_accuracy=0.895, val_f1_score=0.895]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.74it/s][A
Epoch 165:  91%|█████████ | 232/255 [02:31<00:14,  1.53it/s, loss=0.114, v_num=8, train_loss=0.0208, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.334, val_accuracy=0.895, val_

Epoch 165, global step 37515: val_loss was not in top 2


Epoch 166:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.106, v_num=8, train_loss=0.274, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.275, val_accuracy=0.899, val_f1_score=0.899]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 166:  89%|████████▉ | 228/255 [02:30<00:17,  1.52it/s, loss=0.106, v_num=8, train_loss=0.274, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.275, val_accuracy=0.899, val_f1_score=0.899]
Validating:   7%|▋         | 2/29 [00:03<00:38,  1.41s/it][A
Epoch 166:  90%|█████████ | 230/255 [02:30<00:16,  1.53it/s, loss=0.106, v_num=8, train_loss=0.274, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.275, val_accuracy=0.899, val_f1_score=0.899]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.71it/s][A
Epoch 166:  91%|█████████ | 232/255 [02:31<00:14,  1.53it/s, loss=0.106, v_num=8, train_loss=0.274, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.275, val_accuracy=0.899, val_f1

Epoch 166, global step 37741: val_loss was not in top 2


Epoch 167:  89%|████████▊ | 226/255 [02:27<00:18,  1.54it/s, loss=0.143, v_num=8, train_loss=0.157, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.275, val_accuracy=0.905, val_f1_score=0.905] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 167:  89%|████████▉ | 228/255 [02:30<00:17,  1.52it/s, loss=0.143, v_num=8, train_loss=0.157, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.275, val_accuracy=0.905, val_f1_score=0.905]
Validating:   7%|▋         | 2/29 [00:03<00:38,  1.41s/it][A
Epoch 167:  90%|█████████ | 230/255 [02:30<00:16,  1.53it/s, loss=0.143, v_num=8, train_loss=0.157, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.275, val_accuracy=0.905, val_f1_score=0.905]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.70it/s][A
Epoch 167:  91%|█████████ | 232/255 [02:31<00:14,  1.54it/s, loss=0.143, v_num=8, train_loss=0.157, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.275, val_accuracy=0.905, val_f1_

Epoch 167, global step 37967: val_loss was not in top 2


Epoch 168:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.123, v_num=8, train_loss=0.252, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.319, val_accuracy=0.892, val_f1_score=0.892] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 168:  89%|████████▉ | 228/255 [02:30<00:17,  1.51it/s, loss=0.123, v_num=8, train_loss=0.252, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.319, val_accuracy=0.892, val_f1_score=0.892]
Validating:   7%|▋         | 2/29 [00:03<00:38,  1.42s/it][A
Epoch 168:  90%|█████████ | 230/255 [02:31<00:16,  1.52it/s, loss=0.123, v_num=8, train_loss=0.252, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.319, val_accuracy=0.892, val_f1_score=0.892]
Validating:  14%|█▍        | 4/29 [00:03<00:15,  1.64it/s][A
Epoch 168:  91%|█████████ | 232/255 [02:31<00:15,  1.53it/s, loss=0.123, v_num=8, train_loss=0.252, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.319, val_accuracy=0.892, val_f1_

Epoch 168, global step 38193: val_loss was not in top 2


Epoch 169:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.206, v_num=8, train_loss=0.134, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.267, val_accuracy=0.907, val_f1_score=0.907] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 169:  89%|████████▉ | 228/255 [02:30<00:17,  1.51it/s, loss=0.206, v_num=8, train_loss=0.134, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.267, val_accuracy=0.907, val_f1_score=0.907]
Validating:   7%|▋         | 2/29 [00:03<00:38,  1.42s/it][A
Epoch 169:  90%|█████████ | 230/255 [02:30<00:16,  1.52it/s, loss=0.206, v_num=8, train_loss=0.134, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.267, val_accuracy=0.907, val_f1_score=0.907]
Validating:  14%|█▍        | 4/29 [00:03<00:15,  1.65it/s][A
Epoch 169:  91%|█████████ | 232/255 [02:31<00:15,  1.53it/s, loss=0.206, v_num=8, train_loss=0.134, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.267, val_accuracy=0.907, val_f1_

Epoch 169, global step 38419: val_loss was not in top 2


Epoch 170:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.161, v_num=8, train_loss=0.0432, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.304, val_accuracy=0.890, val_f1_score=0.890]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 170:  89%|████████▉ | 228/255 [02:30<00:17,  1.51it/s, loss=0.161, v_num=8, train_loss=0.0432, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.304, val_accuracy=0.890, val_f1_score=0.890]
Validating:   7%|▋         | 2/29 [00:03<00:38,  1.44s/it][A
Epoch 170:  90%|█████████ | 230/255 [02:31<00:16,  1.52it/s, loss=0.161, v_num=8, train_loss=0.0432, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.304, val_accuracy=0.890, val_f1_score=0.890]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.75it/s][A
Epoch 170:  91%|█████████ | 232/255 [02:31<00:15,  1.53it/s, loss=0.161, v_num=8, train_loss=0.0432, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.304, val_accuracy=0.890, val_

Epoch 170, global step 38645: val_loss was not in top 2


Epoch 171:  89%|████████▊ | 226/255 [02:29<00:19,  1.52it/s, loss=0.126, v_num=8, train_loss=0.0713, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.269, val_accuracy=0.903, val_f1_score=0.903]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 171:  89%|████████▉ | 228/255 [02:32<00:18,  1.50it/s, loss=0.126, v_num=8, train_loss=0.0713, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.269, val_accuracy=0.903, val_f1_score=0.903]
Validating:   7%|▋         | 2/29 [00:03<00:38,  1.43s/it][A
Epoch 171:  90%|█████████ | 230/255 [02:32<00:16,  1.51it/s, loss=0.126, v_num=8, train_loss=0.0713, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.269, val_accuracy=0.903, val_f1_score=0.903]
Validating:  14%|█▍        | 4/29 [00:03<00:15,  1.64it/s][A
Epoch 171:  91%|█████████ | 232/255 [02:33<00:15,  1.52it/s, loss=0.126, v_num=8, train_loss=0.0713, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.269, val_accuracy=0.903, val_

Epoch 171, global step 38871: val_loss was not in top 2


Epoch 172:  89%|████████▊ | 226/255 [02:31<00:19,  1.50it/s, loss=0.148, v_num=8, train_loss=0.140, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.277, val_accuracy=0.902, val_f1_score=0.902] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 172:  89%|████████▉ | 228/255 [02:34<00:18,  1.48it/s, loss=0.148, v_num=8, train_loss=0.140, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.277, val_accuracy=0.902, val_f1_score=0.902]
Validating:   7%|▋         | 2/29 [00:03<00:38,  1.43s/it][A
Epoch 172:  90%|█████████ | 230/255 [02:34<00:16,  1.49it/s, loss=0.148, v_num=8, train_loss=0.140, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.277, val_accuracy=0.902, val_f1_score=0.902]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.73it/s][A
Epoch 172:  91%|█████████ | 232/255 [02:34<00:15,  1.50it/s, loss=0.148, v_num=8, train_loss=0.140, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.277, val_accuracy=0.902, val_f1_

Epoch 172, global step 39097: val_loss was not in top 2


Epoch 173:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.117, v_num=8, train_loss=0.019, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.275, val_accuracy=0.895, val_f1_score=0.895] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 173:  89%|████████▉ | 228/255 [02:33<00:18,  1.48it/s, loss=0.117, v_num=8, train_loss=0.019, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.275, val_accuracy=0.895, val_f1_score=0.895]
Epoch 173:  90%|█████████ | 230/255 [02:33<00:16,  1.49it/s, loss=0.117, v_num=8, train_loss=0.019, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.275, val_accuracy=0.895, val_f1_score=0.895]
Validating:  14%|█▍        | 4/29 [00:03<00:15,  1.58it/s][A
Epoch 173:  91%|█████████ | 232/255 [02:34<00:15,  1.50it/s, loss=0.117, v_num=8, train_loss=0.019, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.275, val_accuracy=0.895, val_f1_score=0.895]
Validating:  21%|██        | 6/29 [00:03<00:09,  

Epoch 173, global step 39323: val_loss was not in top 2


Epoch 174:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.101, v_num=8, train_loss=0.0911, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.276, val_accuracy=0.901, val_f1_score=0.901]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 174:  89%|████████▉ | 228/255 [02:31<00:17,  1.51it/s, loss=0.101, v_num=8, train_loss=0.0911, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.276, val_accuracy=0.901, val_f1_score=0.901]
Validating:   7%|▋         | 2/29 [00:03<00:38,  1.43s/it][A
Epoch 174:  90%|█████████ | 230/255 [02:31<00:16,  1.52it/s, loss=0.101, v_num=8, train_loss=0.0911, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.276, val_accuracy=0.901, val_f1_score=0.901]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.76it/s][A
Epoch 174:  91%|█████████ | 232/255 [02:31<00:15,  1.53it/s, loss=0.101, v_num=8, train_loss=0.0911, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.276, val_accuracy=0.901, val_

Epoch 174, global step 39549: val_loss was not in top 2


Epoch 175:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.123, v_num=8, train_loss=0.0527, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.270, val_accuracy=0.910, val_f1_score=0.910]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 175:  89%|████████▉ | 228/255 [02:30<00:17,  1.52it/s, loss=0.123, v_num=8, train_loss=0.0527, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.270, val_accuracy=0.910, val_f1_score=0.910]
Validating:   7%|▋         | 2/29 [00:03<00:38,  1.42s/it][A
Epoch 175:  90%|█████████ | 230/255 [02:30<00:16,  1.52it/s, loss=0.123, v_num=8, train_loss=0.0527, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.270, val_accuracy=0.910, val_f1_score=0.910]
Validating:  14%|█▍        | 4/29 [00:03<00:15,  1.64it/s][A
Epoch 175:  91%|█████████ | 232/255 [02:31<00:14,  1.53it/s, loss=0.123, v_num=8, train_loss=0.0527, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.270, val_accuracy=0.910, val_

Epoch 175, global step 39775: val_loss was not in top 2


Epoch 176:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.106, v_num=8, train_loss=0.136, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.272, val_accuracy=0.906, val_f1_score=0.906]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 176:  89%|████████▉ | 228/255 [02:30<00:17,  1.51it/s, loss=0.106, v_num=8, train_loss=0.136, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.272, val_accuracy=0.906, val_f1_score=0.906]
Validating:   7%|▋         | 2/29 [00:03<00:38,  1.43s/it][A
Epoch 176:  90%|█████████ | 230/255 [02:31<00:16,  1.52it/s, loss=0.106, v_num=8, train_loss=0.136, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.272, val_accuracy=0.906, val_f1_score=0.906]
Validating:  14%|█▍        | 4/29 [00:03<00:15,  1.63it/s][A
Epoch 176:  91%|█████████ | 232/255 [02:31<00:15,  1.53it/s, loss=0.106, v_num=8, train_loss=0.136, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.272, val_accuracy=0.906, val_f1

Epoch 176, global step 40001: val_loss was not in top 2


Epoch 177:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.105, v_num=8, train_loss=0.0639, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.254, val_accuracy=0.913, val_f1_score=0.913] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 177:  89%|████████▉ | 228/255 [02:30<00:17,  1.51it/s, loss=0.105, v_num=8, train_loss=0.0639, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.254, val_accuracy=0.913, val_f1_score=0.913]
Validating:   7%|▋         | 2/29 [00:03<00:38,  1.43s/it][A
Epoch 177:  90%|█████████ | 230/255 [02:30<00:16,  1.52it/s, loss=0.105, v_num=8, train_loss=0.0639, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.254, val_accuracy=0.913, val_f1_score=0.913]
Validating:  14%|█▍        | 4/29 [00:03<00:15,  1.64it/s][A
Epoch 177:  91%|█████████ | 232/255 [02:31<00:14,  1.53it/s, loss=0.105, v_num=8, train_loss=0.0639, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.254, val_accuracy=0.913, val

Epoch 177, global step 40227: val_loss reached 0.22987 (best 0.22987), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-0-v2.ckpt" as top 2


Epoch 178:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.104, v_num=8, train_loss=0.114, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.230, val_accuracy=0.915, val_f1_score=0.915]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 178:  89%|████████▉ | 228/255 [02:30<00:17,  1.51it/s, loss=0.104, v_num=8, train_loss=0.114, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.230, val_accuracy=0.915, val_f1_score=0.915]
Validating:   7%|▋         | 2/29 [00:03<00:38,  1.43s/it][A
Epoch 178:  90%|█████████ | 230/255 [02:31<00:16,  1.52it/s, loss=0.104, v_num=8, train_loss=0.114, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.230, val_accuracy=0.915, val_f1_score=0.915]
Validating:  14%|█▍        | 4/29 [00:03<00:15,  1.62it/s][A
Epoch 178:  91%|█████████ | 232/255 [02:31<00:15,  1.53it/s, loss=0.104, v_num=8, train_loss=0.114, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.230, val_accuracy=0.915, val_f1

Epoch 178, global step 40453: val_loss reached 0.23410 (best 0.22987), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-0-v3.ckpt" as top 2


Epoch 179:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.108, v_num=8, train_loss=0.0361, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.234, val_accuracy=0.917, val_f1_score=0.917] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 179:  89%|████████▉ | 228/255 [02:30<00:17,  1.52it/s, loss=0.108, v_num=8, train_loss=0.0361, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.234, val_accuracy=0.917, val_f1_score=0.917]
Validating:   7%|▋         | 2/29 [00:03<00:38,  1.41s/it][A
Epoch 179:  90%|█████████ | 230/255 [02:30<00:16,  1.53it/s, loss=0.108, v_num=8, train_loss=0.0361, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.234, val_accuracy=0.917, val_f1_score=0.917]
Validating:  14%|█▍        | 4/29 [00:03<00:15,  1.63it/s][A
Epoch 179:  91%|█████████ | 232/255 [02:30<00:14,  1.54it/s, loss=0.108, v_num=8, train_loss=0.0361, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.234, val_accuracy=0.917, val

Epoch 179, global step 40679: val_loss was not in top 2


Epoch 180:  89%|████████▊ | 226/255 [02:27<00:18,  1.54it/s, loss=0.104, v_num=8, train_loss=0.247, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.248, val_accuracy=0.917, val_f1_score=0.917]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 180:  89%|████████▉ | 228/255 [02:30<00:17,  1.52it/s, loss=0.104, v_num=8, train_loss=0.247, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.248, val_accuracy=0.917, val_f1_score=0.917]
Validating:   7%|▋         | 2/29 [00:03<00:37,  1.40s/it][A
Epoch 180:  90%|█████████ | 230/255 [02:30<00:16,  1.53it/s, loss=0.104, v_num=8, train_loss=0.247, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.248, val_accuracy=0.917, val_f1_score=0.917]
Validating:  14%|█▍        | 4/29 [00:03<00:15,  1.64it/s][A
Epoch 180:  91%|█████████ | 232/255 [02:30<00:14,  1.54it/s, loss=0.104, v_num=8, train_loss=0.247, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.248, val_accuracy=0.917, val_f

Epoch 180, global step 40905: val_loss was not in top 2


Epoch 181:  89%|████████▊ | 226/255 [02:27<00:18,  1.54it/s, loss=0.11, v_num=8, train_loss=0.130, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.272, val_accuracy=0.921, val_f1_score=0.921]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 181:  89%|████████▉ | 228/255 [02:30<00:17,  1.52it/s, loss=0.11, v_num=8, train_loss=0.130, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.272, val_accuracy=0.921, val_f1_score=0.921]
Validating:   7%|▋         | 2/29 [00:03<00:38,  1.41s/it][A
Epoch 181:  90%|█████████ | 230/255 [02:30<00:16,  1.53it/s, loss=0.11, v_num=8, train_loss=0.130, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.272, val_accuracy=0.921, val_f1_score=0.921]
Validating:  14%|█▍        | 4/29 [00:03<00:15,  1.66it/s][A
Epoch 181:  91%|█████████ | 232/255 [02:31<00:14,  1.54it/s, loss=0.11, v_num=8, train_loss=0.130, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.272, val_accuracy=0.921, val_f1_sc

Epoch 181, global step 41131: val_loss was not in top 2


Epoch 182:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.11, v_num=8, train_loss=0.406, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.249, val_accuracy=0.912, val_f1_score=0.912]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 182:  89%|████████▉ | 228/255 [02:30<00:17,  1.51it/s, loss=0.11, v_num=8, train_loss=0.406, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.249, val_accuracy=0.912, val_f1_score=0.912]
Validating:   7%|▋         | 2/29 [00:03<00:37,  1.40s/it][A
Epoch 182:  90%|█████████ | 230/255 [02:31<00:16,  1.52it/s, loss=0.11, v_num=8, train_loss=0.406, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.249, val_accuracy=0.912, val_f1_score=0.912]
Validating:  14%|█▍        | 4/29 [00:03<00:15,  1.65it/s][A
Epoch 182:  91%|█████████ | 232/255 [02:31<00:15,  1.53it/s, loss=0.11, v_num=8, train_loss=0.406, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.249, val_accuracy=0.912, val_f1_sc

Epoch 182, global step 41357: val_loss was not in top 2


Epoch 183:  89%|████████▊ | 226/255 [02:27<00:18,  1.54it/s, loss=0.159, v_num=8, train_loss=0.169, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.258, val_accuracy=0.920, val_f1_score=0.920] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 183:  89%|████████▉ | 228/255 [02:30<00:17,  1.51it/s, loss=0.159, v_num=8, train_loss=0.169, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.258, val_accuracy=0.920, val_f1_score=0.920]
Validating:   7%|▋         | 2/29 [00:03<00:40,  1.49s/it][A
Epoch 183:  90%|█████████ | 230/255 [02:30<00:16,  1.52it/s, loss=0.159, v_num=8, train_loss=0.169, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.258, val_accuracy=0.920, val_f1_score=0.920]
Validating:  14%|█▍        | 4/29 [00:03<00:15,  1.67it/s][A
Epoch 183:  91%|█████████ | 232/255 [02:31<00:15,  1.53it/s, loss=0.159, v_num=8, train_loss=0.169, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.258, val_accuracy=0.920, val_f1_

Epoch 183, global step 41583: val_loss was not in top 2


Epoch 184:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.213, v_num=8, train_loss=0.117, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.276, val_accuracy=0.903, val_f1_score=0.903] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 184:  89%|████████▉ | 228/255 [02:30<00:17,  1.51it/s, loss=0.213, v_num=8, train_loss=0.117, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.276, val_accuracy=0.903, val_f1_score=0.903]
Validating:   7%|▋         | 2/29 [00:03<00:37,  1.40s/it][A
Epoch 184:  90%|█████████ | 230/255 [02:30<00:16,  1.52it/s, loss=0.213, v_num=8, train_loss=0.117, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.276, val_accuracy=0.903, val_f1_score=0.903]
Validating:  14%|█▍        | 4/29 [00:03<00:15,  1.66it/s][A
Epoch 184:  91%|█████████ | 232/255 [02:31<00:14,  1.53it/s, loss=0.213, v_num=8, train_loss=0.117, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.276, val_accuracy=0.903, val_f1_

Epoch 184, global step 41809: val_loss was not in top 2


Epoch 185:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.153, v_num=8, train_loss=0.257, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.297, val_accuracy=0.887, val_f1_score=0.887] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 185:  89%|████████▉ | 228/255 [02:30<00:17,  1.51it/s, loss=0.153, v_num=8, train_loss=0.257, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.297, val_accuracy=0.887, val_f1_score=0.887]
Validating:   7%|▋         | 2/29 [00:03<00:38,  1.42s/it][A
Epoch 185:  90%|█████████ | 230/255 [02:31<00:16,  1.52it/s, loss=0.153, v_num=8, train_loss=0.257, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.297, val_accuracy=0.887, val_f1_score=0.887]
Validating:  14%|█▍        | 4/29 [00:03<00:15,  1.64it/s][A
Epoch 185:  91%|█████████ | 232/255 [02:31<00:15,  1.53it/s, loss=0.153, v_num=8, train_loss=0.257, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.297, val_accuracy=0.887, val_f1_

Epoch 185, global step 42035: val_loss was not in top 2


Epoch 186:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.153, v_num=8, train_loss=0.198, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.258, val_accuracy=0.896, val_f1_score=0.896] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 186:  89%|████████▉ | 228/255 [02:30<00:17,  1.51it/s, loss=0.153, v_num=8, train_loss=0.198, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.258, val_accuracy=0.896, val_f1_score=0.896]
Epoch 186:  90%|█████████ | 230/255 [02:31<00:16,  1.52it/s, loss=0.153, v_num=8, train_loss=0.198, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.258, val_accuracy=0.896, val_f1_score=0.896]
Validating:  14%|█▍        | 4/29 [00:03<00:17,  1.42it/s][A
Epoch 186:  91%|█████████ | 232/255 [02:31<00:15,  1.53it/s, loss=0.153, v_num=8, train_loss=0.198, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.258, val_accuracy=0.896, val_f1_score=0.896]
Validating:  21%|██        | 6/29 [00:04<00:09,  

Epoch 186, global step 42261: val_loss was not in top 2


Epoch 187:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.129, v_num=8, train_loss=0.0726, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.288, val_accuracy=0.886, val_f1_score=0.886]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 187:  89%|████████▉ | 228/255 [02:30<00:17,  1.51it/s, loss=0.129, v_num=8, train_loss=0.0726, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.288, val_accuracy=0.886, val_f1_score=0.886]
Validating:   7%|▋         | 2/29 [00:03<00:38,  1.42s/it][A
Epoch 187:  90%|█████████ | 230/255 [02:31<00:16,  1.52it/s, loss=0.129, v_num=8, train_loss=0.0726, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.288, val_accuracy=0.886, val_f1_score=0.886]
Validating:  14%|█▍        | 4/29 [00:03<00:15,  1.65it/s][A
Epoch 187:  91%|█████████ | 232/255 [02:31<00:15,  1.53it/s, loss=0.129, v_num=8, train_loss=0.0726, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.288, val_accuracy=0.886, val_

Epoch 187, global step 42487: val_loss was not in top 2


Epoch 188:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.123, v_num=8, train_loss=0.174, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.265, val_accuracy=0.899, val_f1_score=0.899] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 188:  89%|████████▉ | 228/255 [02:30<00:17,  1.51it/s, loss=0.123, v_num=8, train_loss=0.174, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.265, val_accuracy=0.899, val_f1_score=0.899]
Validating:   7%|▋         | 2/29 [00:03<00:40,  1.49s/it][A
Epoch 188:  90%|█████████ | 230/255 [02:31<00:16,  1.52it/s, loss=0.123, v_num=8, train_loss=0.174, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.265, val_accuracy=0.899, val_f1_score=0.899]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.67it/s][A
Epoch 188:  91%|█████████ | 232/255 [02:31<00:15,  1.53it/s, loss=0.123, v_num=8, train_loss=0.174, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.265, val_accuracy=0.899, val_f1_

Epoch 188, global step 42713: val_loss was not in top 2


Epoch 189:  89%|████████▊ | 226/255 [02:27<00:18,  1.54it/s, loss=0.0991, v_num=8, train_loss=0.0603, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.257, val_accuracy=0.908, val_f1_score=0.908]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 189:  89%|████████▉ | 228/255 [02:30<00:17,  1.52it/s, loss=0.0991, v_num=8, train_loss=0.0603, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.257, val_accuracy=0.908, val_f1_score=0.908]
Validating:   7%|▋         | 2/29 [00:03<00:38,  1.42s/it][A
Epoch 189:  90%|█████████ | 230/255 [02:30<00:16,  1.53it/s, loss=0.0991, v_num=8, train_loss=0.0603, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.257, val_accuracy=0.908, val_f1_score=0.908]
Epoch 189:  91%|█████████ | 232/255 [02:31<00:14,  1.54it/s, loss=0.0991, v_num=8, train_loss=0.0603, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.257, val_accuracy=0.908, val_f1_score=0.908]
Validating:  21%|██        | 6/29 [00:04<0

Epoch 189, global step 42939: val_loss was not in top 2


Epoch 190:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.134, v_num=8, train_loss=0.124, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.279, val_accuracy=0.905, val_f1_score=0.905]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 190:  89%|████████▉ | 228/255 [02:30<00:17,  1.51it/s, loss=0.134, v_num=8, train_loss=0.124, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.279, val_accuracy=0.905, val_f1_score=0.905]
Epoch 190:  90%|█████████ | 230/255 [02:30<00:16,  1.52it/s, loss=0.134, v_num=8, train_loss=0.124, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.279, val_accuracy=0.905, val_f1_score=0.905]
Validating:  14%|█▍        | 4/29 [00:03<00:17,  1.42it/s][A
Epoch 190:  91%|█████████ | 232/255 [02:31<00:14,  1.53it/s, loss=0.134, v_num=8, train_loss=0.124, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.279, val_accuracy=0.905, val_f1_score=0.905]
Validating:  21%|██        | 6/29 [00:04<00:09, 

Epoch 190, global step 43165: val_loss was not in top 2


Epoch 191:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.165, v_num=8, train_loss=0.296, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.305, val_accuracy=0.904, val_f1_score=0.904] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 191:  89%|████████▉ | 228/255 [02:30<00:17,  1.51it/s, loss=0.165, v_num=8, train_loss=0.296, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.305, val_accuracy=0.904, val_f1_score=0.904]
Validating:   7%|▋         | 2/29 [00:03<00:39,  1.46s/it][A
Epoch 191:  90%|█████████ | 230/255 [02:30<00:16,  1.52it/s, loss=0.165, v_num=8, train_loss=0.296, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.305, val_accuracy=0.904, val_f1_score=0.904]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.72it/s][A
Epoch 191:  91%|█████████ | 232/255 [02:31<00:14,  1.53it/s, loss=0.165, v_num=8, train_loss=0.296, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.305, val_accuracy=0.904, val_f1_

Epoch 191, global step 43391: val_loss was not in top 2


Epoch 192:  89%|████████▊ | 226/255 [02:27<00:18,  1.54it/s, loss=0.151, v_num=8, train_loss=0.252, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.308, val_accuracy=0.872, val_f1_score=0.872] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 192:  89%|████████▉ | 228/255 [02:30<00:17,  1.52it/s, loss=0.151, v_num=8, train_loss=0.252, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.308, val_accuracy=0.872, val_f1_score=0.872]
Epoch 192:  90%|█████████ | 230/255 [02:30<00:16,  1.53it/s, loss=0.151, v_num=8, train_loss=0.252, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.308, val_accuracy=0.872, val_f1_score=0.872]
Validating:  14%|█▍        | 4/29 [00:03<00:17,  1.42it/s][A
Epoch 192:  91%|█████████ | 232/255 [02:31<00:14,  1.54it/s, loss=0.151, v_num=8, train_loss=0.252, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.308, val_accuracy=0.872, val_f1_score=0.872]
Validating:  21%|██        | 6/29 [00:04<00:09,  

Epoch 192, global step 43617: val_loss was not in top 2


Epoch 193:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.23, v_num=8, train_loss=0.150, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.307, val_accuracy=0.889, val_f1_score=0.889]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 193:  89%|████████▉ | 228/255 [02:30<00:17,  1.51it/s, loss=0.23, v_num=8, train_loss=0.150, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.307, val_accuracy=0.889, val_f1_score=0.889]
Epoch 193:  90%|█████████ | 230/255 [02:30<00:16,  1.52it/s, loss=0.23, v_num=8, train_loss=0.150, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.307, val_accuracy=0.889, val_f1_score=0.889]
Validating:  14%|█▍        | 4/29 [00:03<00:16,  1.55it/s][A
Epoch 193:  91%|█████████ | 232/255 [02:31<00:15,  1.53it/s, loss=0.23, v_num=8, train_loss=0.150, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.307, val_accuracy=0.889, val_f1_score=0.889]
Validating:  21%|██        | 6/29 [00:04<00:08,  2.5

Epoch 193, global step 43843: val_loss was not in top 2


Epoch 194:  89%|████████▊ | 226/255 [02:27<00:18,  1.54it/s, loss=0.176, v_num=8, train_loss=0.0228, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.382, val_accuracy=0.859, val_f1_score=0.859]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 194:  89%|████████▉ | 228/255 [02:30<00:17,  1.51it/s, loss=0.176, v_num=8, train_loss=0.0228, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.382, val_accuracy=0.859, val_f1_score=0.859]
Validating:   7%|▋         | 2/29 [00:03<00:40,  1.49s/it][A
Epoch 194:  90%|█████████ | 230/255 [02:30<00:16,  1.52it/s, loss=0.176, v_num=8, train_loss=0.0228, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.382, val_accuracy=0.859, val_f1_score=0.859]
Validating:  14%|█▍        | 4/29 [00:03<00:14,  1.68it/s][A
Epoch 194:  91%|█████████ | 232/255 [02:31<00:15,  1.53it/s, loss=0.176, v_num=8, train_loss=0.0228, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.382, val_accuracy=0.859, val_

Epoch 194, global step 44069: val_loss was not in top 2


Epoch 195:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.162, v_num=8, train_loss=0.0335, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.322, val_accuracy=0.881, val_f1_score=0.881]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 195:  89%|████████▉ | 228/255 [02:30<00:17,  1.51it/s, loss=0.162, v_num=8, train_loss=0.0335, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.322, val_accuracy=0.881, val_f1_score=0.881]
Validating:   7%|▋         | 2/29 [00:03<00:38,  1.41s/it][A
Epoch 195:  90%|█████████ | 230/255 [02:30<00:16,  1.52it/s, loss=0.162, v_num=8, train_loss=0.0335, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.322, val_accuracy=0.881, val_f1_score=0.881]
Validating:  14%|█▍        | 4/29 [00:03<00:15,  1.65it/s][A
Epoch 195:  91%|█████████ | 232/255 [02:31<00:15,  1.53it/s, loss=0.162, v_num=8, train_loss=0.0335, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.322, val_accuracy=0.881, val_

Epoch 195, global step 44295: val_loss was not in top 2


Epoch 196:  89%|████████▊ | 226/255 [02:30<00:19,  1.51it/s, loss=0.166, v_num=8, train_loss=0.218, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.395, val_accuracy=0.867, val_f1_score=0.867] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 196:  89%|████████▉ | 228/255 [02:33<00:18,  1.49it/s, loss=0.166, v_num=8, train_loss=0.218, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.395, val_accuracy=0.867, val_f1_score=0.867]
Epoch 196:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.166, v_num=8, train_loss=0.218, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.395, val_accuracy=0.867, val_f1_score=0.867]
Epoch 196:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.166, v_num=8, train_loss=0.218, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.395, val_accuracy=0.867, val_f1_score=0.867]
Epoch 196:  92%|█████████▏| 234/255 [02:33<00:13,  1.52it/s, loss=0.166, v_num=8, train_loss=0.218, train_accur

Epoch 196, global step 44521: val_loss was not in top 2


Epoch 197:  89%|████████▊ | 226/255 [02:31<00:19,  1.50it/s, loss=0.144, v_num=8, train_loss=0.0526, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.315, val_accuracy=0.882, val_f1_score=0.882]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 197:  89%|████████▉ | 228/255 [02:34<00:18,  1.48it/s, loss=0.144, v_num=8, train_loss=0.0526, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.315, val_accuracy=0.882, val_f1_score=0.882]
Epoch 197:  90%|█████████ | 230/255 [02:34<00:16,  1.49it/s, loss=0.144, v_num=8, train_loss=0.0526, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.315, val_accuracy=0.882, val_f1_score=0.882]
Epoch 197:  91%|█████████ | 232/255 [02:34<00:15,  1.50it/s, loss=0.144, v_num=8, train_loss=0.0526, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.315, val_accuracy=0.882, val_f1_score=0.882]
Epoch 197:  92%|█████████▏| 234/255 [02:34<00:13,  1.51it/s, loss=0.144, v_num=8, train_loss=0.0526, train_a

Epoch 197, global step 44747: val_loss was not in top 2


Epoch 198:  89%|████████▊ | 226/255 [02:29<00:19,  1.52it/s, loss=0.166, v_num=8, train_loss=0.0664, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.280, val_accuracy=0.900, val_f1_score=0.900]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 198:  89%|████████▉ | 228/255 [02:32<00:18,  1.49it/s, loss=0.166, v_num=8, train_loss=0.0664, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.280, val_accuracy=0.900, val_f1_score=0.900]
Validating:   7%|▋         | 2/29 [00:03<00:41,  1.54s/it][A
Epoch 198:  90%|█████████ | 230/255 [02:32<00:16,  1.50it/s, loss=0.166, v_num=8, train_loss=0.0664, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.280, val_accuracy=0.900, val_f1_score=0.900]
Validating:  14%|█▍        | 4/29 [00:03<00:15,  1.64it/s][A
Epoch 198:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.166, v_num=8, train_loss=0.0664, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.280, val_accuracy=0.900, val_

Epoch 198, global step 44973: val_loss was not in top 2


Epoch 199:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.152, v_num=8, train_loss=0.073, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.296, val_accuracy=0.901, val_f1_score=0.901] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 199:  89%|████████▉ | 228/255 [02:30<00:17,  1.51it/s, loss=0.152, v_num=8, train_loss=0.073, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.296, val_accuracy=0.901, val_f1_score=0.901]
Epoch 199:  90%|█████████ | 230/255 [02:30<00:16,  1.52it/s, loss=0.152, v_num=8, train_loss=0.073, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.296, val_accuracy=0.901, val_f1_score=0.901]
Validating:  14%|█▍        | 4/29 [00:03<00:17,  1.43it/s][A
Epoch 199:  91%|█████████ | 232/255 [02:31<00:14,  1.53it/s, loss=0.152, v_num=8, train_loss=0.073, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.296, val_accuracy=0.901, val_f1_score=0.901]
Validating:  21%|██        | 6/29 [00:04<00:09,  

Epoch 199, global step 45199: val_loss was not in top 2


Epoch 199: 100%|██████████| 255/255 [02:36<00:00,  1.63it/s, loss=0.152, v_num=8, train_loss=0.073, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.288, val_accuracy=0.895, val_f1_score=0.895]


LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1,2]


Testing: 100%|██████████| 29/29 [00:08<00:00,  3.70it/s]--------------------------------------------------------------------------------
DATALOADER:0 TEST RESULTS
{'test_f1_score': 0.8992193341255188,
 'test_train_accuracy': 0.8992193341255188,
 'test_train_loss': 0.28896135091781616}
--------------------------------------------------------------------------------
Testing: 100%|██████████| 29/29 [00:08<00:00,  3.32it/s]
------------------ Round: 1 ------------------
['FP2', 'FCZ', 'FT10', 'O2', 'O1', 'FT7', 'F4', 'TP7', 'C3', 'C4', 'F3', 'FT8', 'T6', 'HEOR', 'T5', 'VEOL', 'F7', 'FZ', 'VEOU', 'A1', 'P3', 'PZ', 'CP3', 'P4', 'CPZ', 'A2', 'HEOL', 'CP4', 'FT9', 'F8', 'OZ', 'CZ', 'FC4', 'FC3', 'FP1', 'PO1', 'T3', 'T4', 'PO2']
Len: 39


GPU available: True, used: True
TPU available: False, using: 0 TPU cores
IPU available: False, using: 0 IPUs
LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1,2]

  | Name      | Type             | Params
-----------------------------------------------
0 | model     | DrowsyModel      | 1.4 M 
1 | criterion | CrossEntropyLoss | 0     
-----------------------------------------------
1.4 M     Trainable params
0         Non-trainable params
1.4 M     Total params
5.429     Total estimated model params size (MB)
  rank_zero_warn(f"Checkpoint directory {dirpath} exists and is not empty.")


                                                                      

Global seed set to 42


Epoch 0:  89%|████████▊ | 226/255 [02:30<00:19,  1.51it/s, loss=0.621, v_num=1, train_loss=0.626, train_accuracy=0.611, train_f1_score=0.611]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 0:  89%|████████▉ | 228/255 [02:35<00:18,  1.47it/s, loss=0.621, v_num=1, train_loss=0.626, train_accuracy=0.611, train_f1_score=0.611]
Validating:   7%|▋         | 2/29 [00:05<01:02,  2.33s/it][A
Epoch 0:  90%|█████████ | 230/255 [02:35<00:16,  1.48it/s, loss=0.621, v_num=1, train_loss=0.626, train_accuracy=0.611, train_f1_score=0.611]
Validating:  14%|█▍        | 4/29 [00:05<00:22,  1.12it/s][A
Epoch 0:  91%|█████████ | 232/255 [02:36<00:15,  1.48it/s, loss=0.621, v_num=1, train_loss=0.626, train_accuracy=0.611, train_f1_score=0.611]
Validating:  21%|██        | 6/29 [00:06<00:11,  2.02it/s][A
Epoch 0:  92%|█████████▏| 234/255 [02:36<00:14,  1.49it/s, loss=0.621, v_num=1, train_loss=0.626, train_accuracy=0.611, train_f1_score=0.611]
Validating:  28%

Epoch 0, global step 225: val_loss reached 0.64166 (best 0.64166), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v2.ckpt" as top 2


Epoch 1:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.566, v_num=1, train_loss=0.532, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.642, val_accuracy=0.666, val_f1_score=0.666]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 1:  89%|████████▉ | 228/255 [02:35<00:18,  1.46it/s, loss=0.566, v_num=1, train_loss=0.532, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.642, val_accuracy=0.666, val_f1_score=0.666]
Validating:   7%|▋         | 2/29 [00:05<01:04,  2.40s/it][A
Epoch 1:  90%|█████████ | 230/255 [02:36<00:16,  1.47it/s, loss=0.566, v_num=1, train_loss=0.532, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.642, val_accuracy=0.666, val_f1_score=0.666]
Validating:  14%|█▍        | 4/29 [00:06<00:23,  1.07it/s][A
Epoch 1:  91%|█████████ | 232/255 [02:36<00:15,  1.48it/s, loss=0.566, v_num=1, train_loss=0.532, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.642, val_accuracy=0.666, val_f1_score=0.6

Epoch 1, global step 451: val_loss reached 0.56226 (best 0.56226), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v3.ckpt" as top 2


Epoch 2:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.512, v_num=1, train_loss=0.390, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.562, val_accuracy=0.726, val_f1_score=0.726]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 2:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.512, v_num=1, train_loss=0.390, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.562, val_accuracy=0.726, val_f1_score=0.726]
Validating:   7%|▋         | 2/29 [00:05<01:04,  2.39s/it][A
Epoch 2:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.512, v_num=1, train_loss=0.390, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.562, val_accuracy=0.726, val_f1_score=0.726]
Epoch 2:  91%|█████████ | 232/255 [02:36<00:15,  1.48it/s, loss=0.512, v_num=1, train_loss=0.390, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.562, val_accuracy=0.726, val_f1_score=0.726]
Validating:  21%|██        | 6/29 [00:06<00:12,  1.91it/s]

Epoch 2, global step 677: val_loss reached 0.58085 (best 0.56226), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v2.ckpt" as top 2


Epoch 3:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.399, v_num=1, train_loss=0.362, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.581, val_accuracy=0.724, val_f1_score=0.724]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 3:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.399, v_num=1, train_loss=0.362, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.581, val_accuracy=0.724, val_f1_score=0.724]
Validating:   7%|▋         | 2/29 [00:05<01:04,  2.39s/it][A
Epoch 3:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.399, v_num=1, train_loss=0.362, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.581, val_accuracy=0.724, val_f1_score=0.724]
Validating:  14%|█▍        | 4/29 [00:06<00:23,  1.07it/s][A
Epoch 3:  91%|█████████ | 232/255 [02:36<00:15,  1.48it/s, loss=0.399, v_num=1, train_loss=0.362, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.581, val_accuracy=0.724, val_f1_score=0.7

Epoch 3, global step 903: val_loss reached 0.53172 (best 0.53172), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v2.ckpt" as top 2


Epoch 4:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.631, v_num=1, train_loss=0.746, train_accuracy=0.611, train_f1_score=0.611, val_loss=0.532, val_accuracy=0.786, val_f1_score=0.786]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 4:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.631, v_num=1, train_loss=0.746, train_accuracy=0.611, train_f1_score=0.611, val_loss=0.532, val_accuracy=0.786, val_f1_score=0.786]
Validating:   7%|▋         | 2/29 [00:05<01:06,  2.47s/it][A
Epoch 4:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.631, v_num=1, train_loss=0.746, train_accuracy=0.611, train_f1_score=0.611, val_loss=0.532, val_accuracy=0.786, val_f1_score=0.786]
Validating:  14%|█▍        | 4/29 [00:06<00:23,  1.05it/s][A
Epoch 4:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.631, v_num=1, train_loss=0.746, train_accuracy=0.611, train_f1_score=0.611, val_loss=0.532, val_accuracy=0.786, val_f1_score=0.7

Epoch 4, global step 1129: val_loss was not in top 2


Epoch 5:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.739, v_num=1, train_loss=0.863, train_accuracy=0.611, train_f1_score=0.611, val_loss=0.637, val_accuracy=0.628, val_f1_score=0.628]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 5:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.739, v_num=1, train_loss=0.863, train_accuracy=0.611, train_f1_score=0.611, val_loss=0.637, val_accuracy=0.628, val_f1_score=0.628]
Validating:   7%|▋         | 2/29 [00:05<01:06,  2.47s/it][A
Epoch 5:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.739, v_num=1, train_loss=0.863, train_accuracy=0.611, train_f1_score=0.611, val_loss=0.637, val_accuracy=0.628, val_f1_score=0.628]
Validating:  14%|█▍        | 4/29 [00:06<00:22,  1.10it/s][A
Epoch 5:  91%|█████████ | 232/255 [02:36<00:15,  1.48it/s, loss=0.739, v_num=1, train_loss=0.863, train_accuracy=0.611, train_f1_score=0.611, val_loss=0.637, val_accuracy=0.628, val_f1_score=0.6

Epoch 5, global step 1355: val_loss was not in top 2


Epoch 6:  89%|████████▊ | 226/255 [02:29<00:19,  1.51it/s, loss=0.516, v_num=1, train_loss=0.440, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.643, val_accuracy=0.693, val_f1_score=0.693]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 6:  89%|████████▉ | 228/255 [02:35<00:18,  1.47it/s, loss=0.516, v_num=1, train_loss=0.440, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.643, val_accuracy=0.693, val_f1_score=0.693]
Validating:   7%|▋         | 2/29 [00:05<01:06,  2.48s/it][A
Epoch 6:  90%|█████████ | 230/255 [02:36<00:16,  1.47it/s, loss=0.516, v_num=1, train_loss=0.440, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.643, val_accuracy=0.693, val_f1_score=0.693]
Validating:  14%|█▍        | 4/29 [00:06<00:23,  1.07it/s][A
Epoch 6:  91%|█████████ | 232/255 [02:36<00:15,  1.48it/s, loss=0.516, v_num=1, train_loss=0.440, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.643, val_accuracy=0.693, val_f1_score=0.6

Epoch 6, global step 1581: val_loss reached 0.52321 (best 0.52321), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v3.ckpt" as top 2


Epoch 7:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.444, v_num=1, train_loss=0.604, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.523, val_accuracy=0.749, val_f1_score=0.749]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 7:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.444, v_num=1, train_loss=0.604, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.523, val_accuracy=0.749, val_f1_score=0.749]
Validating:   7%|▋         | 2/29 [00:05<01:06,  2.47s/it][A
Epoch 7:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.444, v_num=1, train_loss=0.604, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.523, val_accuracy=0.749, val_f1_score=0.749]
Validating:  14%|█▍        | 4/29 [00:06<00:22,  1.09it/s][A
Epoch 7:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.444, v_num=1, train_loss=0.604, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.523, val_accuracy=0.749, val_f1_score=0.7

Epoch 7, global step 1807: val_loss reached 0.50760 (best 0.50760), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v2.ckpt" as top 2


Epoch 8:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.345, v_num=1, train_loss=0.408, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.508, val_accuracy=0.768, val_f1_score=0.768]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 8:  89%|████████▉ | 228/255 [02:40<00:19,  1.42it/s, loss=0.345, v_num=1, train_loss=0.408, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.508, val_accuracy=0.768, val_f1_score=0.768]
Validating:   7%|▋         | 2/29 [00:05<01:06,  2.46s/it][A
Epoch 8:  90%|█████████ | 230/255 [02:40<00:17,  1.43it/s, loss=0.345, v_num=1, train_loss=0.408, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.508, val_accuracy=0.768, val_f1_score=0.768]
Validating:  14%|█▍        | 4/29 [00:06<00:23,  1.05it/s][A
Epoch 8:  91%|█████████ | 232/255 [02:41<00:15,  1.44it/s, loss=0.345, v_num=1, train_loss=0.408, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.508, val_accuracy=0.768, val_f1_score=0.7

Epoch 8, global step 2033: val_loss reached 0.48518 (best 0.48518), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v3.ckpt" as top 2


Epoch 9:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.36, v_num=1, train_loss=0.361, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.485, val_accuracy=0.793, val_f1_score=0.793] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 9:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.36, v_num=1, train_loss=0.361, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.485, val_accuracy=0.793, val_f1_score=0.793]
Validating:   7%|▋         | 2/29 [00:05<01:06,  2.45s/it][A
Epoch 9:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.36, v_num=1, train_loss=0.361, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.485, val_accuracy=0.793, val_f1_score=0.793]
Validating:  14%|█▍        | 4/29 [00:06<00:22,  1.10it/s][A
Epoch 9:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.36, v_num=1, train_loss=0.361, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.485, val_accuracy=0.793, val_f1_score=0.793]

Epoch 9, global step 2259: val_loss was not in top 2


Epoch 10:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.345, v_num=1, train_loss=0.498, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.514, val_accuracy=0.784, val_f1_score=0.784]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 10:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.345, v_num=1, train_loss=0.498, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.514, val_accuracy=0.784, val_f1_score=0.784]
Validating:   7%|▋         | 2/29 [00:05<01:06,  2.47s/it][A
Epoch 10:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.345, v_num=1, train_loss=0.498, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.514, val_accuracy=0.784, val_f1_score=0.784]
Validating:  14%|█▍        | 4/29 [00:06<00:22,  1.10it/s][A
Epoch 10:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.345, v_num=1, train_loss=0.498, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.514, val_accuracy=0.784, val_f1_score

Epoch 10, global step 2485: val_loss was not in top 2


Epoch 11:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.318, v_num=1, train_loss=0.196, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.605, val_accuracy=0.779, val_f1_score=0.779]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 11:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.318, v_num=1, train_loss=0.196, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.605, val_accuracy=0.779, val_f1_score=0.779]
Epoch 11:  90%|█████████ | 230/255 [02:36<00:16,  1.47it/s, loss=0.318, v_num=1, train_loss=0.196, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.605, val_accuracy=0.779, val_f1_score=0.779]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.03s/it][A
Epoch 11:  91%|█████████ | 232/255 [02:36<00:15,  1.48it/s, loss=0.318, v_num=1, train_loss=0.196, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.605, val_accuracy=0.779, val_f1_score=0.779]
Epoch 11:  92%|█████████▏| 234/255 [02:37<00:14,  1.49

Epoch 11, global step 2711: val_loss reached 0.43867 (best 0.43867), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v2.ckpt" as top 2


Epoch 12:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.302, v_num=1, train_loss=0.146, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.439, val_accuracy=0.826, val_f1_score=0.826]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 12:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.302, v_num=1, train_loss=0.146, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.439, val_accuracy=0.826, val_f1_score=0.826]
Validating:   7%|▋         | 2/29 [00:06<01:08,  2.52s/it][A
Epoch 12:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.302, v_num=1, train_loss=0.146, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.439, val_accuracy=0.826, val_f1_score=0.826]
Validating:  14%|█▍        | 4/29 [00:06<00:23,  1.06it/s][A
Epoch 12:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.302, v_num=1, train_loss=0.146, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.439, val_accuracy=0.826, val_f1_score

Epoch 12, global step 2937: val_loss reached 0.38176 (best 0.38176), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v3.ckpt" as top 2


Epoch 13:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.632, v_num=1, train_loss=0.377, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.382, val_accuracy=0.859, val_f1_score=0.859]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 13:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.632, v_num=1, train_loss=0.377, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.382, val_accuracy=0.859, val_f1_score=0.859]
Validating:   7%|▋         | 2/29 [00:05<01:06,  2.46s/it][A
Epoch 13:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.632, v_num=1, train_loss=0.377, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.382, val_accuracy=0.859, val_f1_score=0.859]
Validating:  14%|█▍        | 4/29 [00:06<00:22,  1.10it/s][A
Epoch 13:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.632, v_num=1, train_loss=0.377, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.382, val_accuracy=0.859, val_f1_score

Epoch 13, global step 3163: val_loss was not in top 2


Epoch 14:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.314, v_num=1, train_loss=0.190, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.639, val_accuracy=0.698, val_f1_score=0.698]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 14:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.314, v_num=1, train_loss=0.190, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.639, val_accuracy=0.698, val_f1_score=0.698]
Validating:   7%|▋         | 2/29 [00:05<01:05,  2.43s/it][A
Epoch 14:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.314, v_num=1, train_loss=0.190, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.639, val_accuracy=0.698, val_f1_score=0.698]
Validating:  14%|█▍        | 4/29 [00:06<00:23,  1.07it/s][A
Epoch 14:  91%|█████████ | 232/255 [02:36<00:15,  1.48it/s, loss=0.314, v_num=1, train_loss=0.190, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.639, val_accuracy=0.698, val_f1_score

Epoch 14, global step 3389: val_loss was not in top 2


Epoch 15:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.31, v_num=1, train_loss=0.499, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.478, val_accuracy=0.823, val_f1_score=0.823] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 15:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.31, v_num=1, train_loss=0.499, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.478, val_accuracy=0.823, val_f1_score=0.823]
Validating:   7%|▋         | 2/29 [00:06<01:08,  2.53s/it][A
Epoch 15:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.31, v_num=1, train_loss=0.499, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.478, val_accuracy=0.823, val_f1_score=0.823]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.02it/s][A
Epoch 15:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.31, v_num=1, train_loss=0.499, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.478, val_accuracy=0.823, val_f1_score=0.

Epoch 15, global step 3615: val_loss was not in top 2


Epoch 16:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.273, v_num=1, train_loss=0.204, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.547, val_accuracy=0.820, val_f1_score=0.820]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 16:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.273, v_num=1, train_loss=0.204, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.547, val_accuracy=0.820, val_f1_score=0.820]
Validating:   7%|▋         | 2/29 [00:06<01:07,  2.51s/it][A
Epoch 16:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.273, v_num=1, train_loss=0.204, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.547, val_accuracy=0.820, val_f1_score=0.820]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.03it/s][A
Epoch 16:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.273, v_num=1, train_loss=0.204, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.547, val_accuracy=0.820, val_f1_score

Epoch 16, global step 3841: val_loss reached 0.43762 (best 0.38176), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v2.ckpt" as top 2


Epoch 17:  89%|████████▊ | 226/255 [02:35<00:19,  1.46it/s, loss=0.254, v_num=1, train_loss=0.231, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.438, val_accuracy=0.825, val_f1_score=0.825]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 17:  89%|████████▉ | 228/255 [02:41<00:19,  1.42it/s, loss=0.254, v_num=1, train_loss=0.231, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.438, val_accuracy=0.825, val_f1_score=0.825]
Validating:   7%|▋         | 2/29 [00:06<01:09,  2.57s/it][A
Epoch 17:  90%|█████████ | 230/255 [02:41<00:17,  1.42it/s, loss=0.254, v_num=1, train_loss=0.231, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.438, val_accuracy=0.825, val_f1_score=0.825]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.04it/s][A
Epoch 17:  91%|█████████ | 232/255 [02:41<00:16,  1.43it/s, loss=0.254, v_num=1, train_loss=0.231, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.438, val_accuracy=0.825, val_f1_score

Epoch 17, global step 4067: val_loss reached 0.43691 (best 0.38176), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v2.ckpt" as top 2


Epoch 18:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.223, v_num=1, train_loss=0.0996, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.437, val_accuracy=0.836, val_f1_score=0.836]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 18:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.223, v_num=1, train_loss=0.0996, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.437, val_accuracy=0.836, val_f1_score=0.836]
Validating:   7%|▋         | 2/29 [00:06<01:08,  2.54s/it][A
Epoch 18:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.223, v_num=1, train_loss=0.0996, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.437, val_accuracy=0.836, val_f1_score=0.836]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.02it/s][A
Epoch 18:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.223, v_num=1, train_loss=0.0996, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.437, val_accuracy=0.836, val_f1_s

Epoch 18, global step 4293: val_loss reached 0.41898 (best 0.38176), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v2.ckpt" as top 2


Epoch 19:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.289, v_num=1, train_loss=0.254, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.419, val_accuracy=0.843, val_f1_score=0.843] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 19:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.289, v_num=1, train_loss=0.254, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.419, val_accuracy=0.843, val_f1_score=0.843]
Epoch 19:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.289, v_num=1, train_loss=0.254, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.419, val_accuracy=0.843, val_f1_score=0.843]
Validating:  14%|█▍        | 4/29 [00:06<00:26,  1.06s/it][A
Epoch 19:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.289, v_num=1, train_loss=0.254, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.419, val_accuracy=0.843, val_f1_score=0.843]
Validating:  21%|██        | 6/29 [00:06<00:13,  1.70

Epoch 19, global step 4519: val_loss was not in top 2


Epoch 20:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.246, v_num=1, train_loss=0.164, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.513, val_accuracy=0.818, val_f1_score=0.818]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 20:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.246, v_num=1, train_loss=0.164, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.513, val_accuracy=0.818, val_f1_score=0.818]
Validating:   7%|▋         | 2/29 [00:06<01:08,  2.54s/it][A
Epoch 20:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.246, v_num=1, train_loss=0.164, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.513, val_accuracy=0.818, val_f1_score=0.818]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.02it/s][A
Epoch 20:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.246, v_num=1, train_loss=0.164, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.513, val_accuracy=0.818, val_f1_score

Epoch 20, global step 4745: val_loss reached 0.39264 (best 0.38176), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v2.ckpt" as top 2


Epoch 21:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.209, v_num=1, train_loss=0.114, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.393, val_accuracy=0.847, val_f1_score=0.847] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 21:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.209, v_num=1, train_loss=0.114, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.393, val_accuracy=0.847, val_f1_score=0.847]
Validating:   7%|▋         | 2/29 [00:05<01:07,  2.50s/it][A
Epoch 21:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.209, v_num=1, train_loss=0.114, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.393, val_accuracy=0.847, val_f1_score=0.847]
Validating:  14%|█▍        | 4/29 [00:06<00:23,  1.08it/s][A
Epoch 21:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.209, v_num=1, train_loss=0.114, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.393, val_accuracy=0.847, val_f1_scor

Epoch 21, global step 4971: val_loss was not in top 2


Epoch 22:  89%|████████▊ | 226/255 [02:31<00:19,  1.49it/s, loss=0.365, v_num=1, train_loss=0.383, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.441, val_accuracy=0.855, val_f1_score=0.855] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 22:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.365, v_num=1, train_loss=0.383, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.441, val_accuracy=0.855, val_f1_score=0.855]
Validating:   7%|▋         | 2/29 [00:06<01:08,  2.53s/it][A
Epoch 22:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.365, v_num=1, train_loss=0.383, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.441, val_accuracy=0.855, val_f1_score=0.855]
Validating:  14%|█▍        | 4/29 [00:06<00:23,  1.07it/s][A
Epoch 22:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.365, v_num=1, train_loss=0.383, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.441, val_accuracy=0.855, val_f1_scor

Epoch 22, global step 5197: val_loss was not in top 2


Epoch 23:  89%|████████▊ | 226/255 [02:31<00:19,  1.50it/s, loss=0.248, v_num=1, train_loss=0.051, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.751, val_accuracy=0.767, val_f1_score=0.767] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 23:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.248, v_num=1, train_loss=0.051, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.751, val_accuracy=0.767, val_f1_score=0.767]
Epoch 23:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.248, v_num=1, train_loss=0.051, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.751, val_accuracy=0.767, val_f1_score=0.767]
Validating:  14%|█▍        | 4/29 [00:06<00:29,  1.16s/it][A
Epoch 23:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.248, v_num=1, train_loss=0.051, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.751, val_accuracy=0.767, val_f1_score=0.767]
Validating:  21%|██        | 6/29 [00:06<00:14,  1.60

Epoch 23, global step 5423: val_loss was not in top 2


Epoch 24:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.264, v_num=1, train_loss=0.372, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.432, val_accuracy=0.852, val_f1_score=0.852] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 24:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.264, v_num=1, train_loss=0.372, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.432, val_accuracy=0.852, val_f1_score=0.852]
Validating:   7%|▋         | 2/29 [00:06<01:07,  2.50s/it][A
Epoch 24:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.264, v_num=1, train_loss=0.372, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.432, val_accuracy=0.852, val_f1_score=0.852]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.04it/s][A
Epoch 24:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.264, v_num=1, train_loss=0.372, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.432, val_accuracy=0.852, val_f1_scor

Epoch 24, global step 5649: val_loss reached 0.36690 (best 0.36690), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v2.ckpt" as top 2


Epoch 25:  89%|████████▊ | 226/255 [02:31<00:19,  1.49it/s, loss=0.224, v_num=1, train_loss=0.174, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.367, val_accuracy=0.853, val_f1_score=0.853]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 25:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.224, v_num=1, train_loss=0.174, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.367, val_accuracy=0.853, val_f1_score=0.853]
Validating:   7%|▋         | 2/29 [00:06<01:08,  2.53s/it][A
Epoch 25:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.224, v_num=1, train_loss=0.174, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.367, val_accuracy=0.853, val_f1_score=0.853]
Epoch 25:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.224, v_num=1, train_loss=0.174, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.367, val_accuracy=0.853, val_f1_score=0.853]
Epoch 25:  92%|█████████▏| 234/255 [02:38<00:14,  1.48

Epoch 25, global step 5875: val_loss was not in top 2


Epoch 26:  89%|████████▊ | 226/255 [02:33<00:19,  1.47it/s, loss=0.219, v_num=1, train_loss=0.0748, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.410, val_accuracy=0.850, val_f1_score=0.850]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 26:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.219, v_num=1, train_loss=0.0748, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.410, val_accuracy=0.850, val_f1_score=0.850]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.64s/it][A
Epoch 26:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.219, v_num=1, train_loss=0.0748, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.410, val_accuracy=0.850, val_f1_score=0.850]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.03it/s][A
Epoch 26:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.219, v_num=1, train_loss=0.0748, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.410, val_accuracy=0.850, val_f1_s

Epoch 26, global step 6101: val_loss was not in top 2


Epoch 27:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.294, v_num=1, train_loss=0.229, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.504, val_accuracy=0.835, val_f1_score=0.835] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 27:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.294, v_num=1, train_loss=0.229, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.504, val_accuracy=0.835, val_f1_score=0.835]
Validating:   7%|▋         | 2/29 [00:06<01:09,  2.58s/it][A
Epoch 27:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.294, v_num=1, train_loss=0.229, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.504, val_accuracy=0.835, val_f1_score=0.835]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.02it/s][A
Epoch 27:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.294, v_num=1, train_loss=0.229, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.504, val_accuracy=0.835, val_f1_scor

Epoch 27, global step 6327: val_loss was not in top 2


Epoch 28:  89%|████████▊ | 226/255 [02:31<00:19,  1.49it/s, loss=0.182, v_num=1, train_loss=0.200, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.526, val_accuracy=0.845, val_f1_score=0.845] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 28:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.182, v_num=1, train_loss=0.200, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.526, val_accuracy=0.845, val_f1_score=0.845]
Validating:   7%|▋         | 2/29 [00:06<01:07,  2.51s/it][A
Epoch 28:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.182, v_num=1, train_loss=0.200, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.526, val_accuracy=0.845, val_f1_score=0.845]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.03it/s][A
Epoch 28:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.182, v_num=1, train_loss=0.200, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.526, val_accuracy=0.845, val_f1_scor

Epoch 28, global step 6553: val_loss was not in top 2


Epoch 29:  89%|████████▊ | 226/255 [02:31<00:19,  1.50it/s, loss=0.217, v_num=1, train_loss=0.355, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.481, val_accuracy=0.851, val_f1_score=0.851]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 29:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.217, v_num=1, train_loss=0.355, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.481, val_accuracy=0.851, val_f1_score=0.851]
Validating:   7%|▋         | 2/29 [00:06<01:08,  2.55s/it][A
Epoch 29:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.217, v_num=1, train_loss=0.355, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.481, val_accuracy=0.851, val_f1_score=0.851]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.02it/s][A
Epoch 29:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.217, v_num=1, train_loss=0.355, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.481, val_accuracy=0.851, val_f1_score

Epoch 29, global step 6779: val_loss was not in top 2


Epoch 30:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.151, v_num=1, train_loss=0.137, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.478, val_accuracy=0.848, val_f1_score=0.848] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 30:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.151, v_num=1, train_loss=0.137, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.478, val_accuracy=0.848, val_f1_score=0.848]
Validating:   7%|▋         | 2/29 [00:06<01:08,  2.54s/it][A
Epoch 30:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.151, v_num=1, train_loss=0.137, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.478, val_accuracy=0.848, val_f1_score=0.848]
Epoch 30:  91%|█████████ | 232/255 [02:36<00:15,  1.48it/s, loss=0.151, v_num=1, train_loss=0.137, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.478, val_accuracy=0.848, val_f1_score=0.848]
Validating:  21%|██        | 6/29 [00:06<00:13,  1.73

Epoch 30, global step 7005: val_loss was not in top 2


Epoch 31:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.241, v_num=1, train_loss=0.172, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.481, val_accuracy=0.878, val_f1_score=0.878] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 31:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.241, v_num=1, train_loss=0.172, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.481, val_accuracy=0.878, val_f1_score=0.878]
Validating:   7%|▋         | 2/29 [00:06<01:09,  2.56s/it][A
Epoch 31:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.241, v_num=1, train_loss=0.172, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.481, val_accuracy=0.878, val_f1_score=0.878]
Validating:  14%|█▍        | 4/29 [00:06<00:23,  1.06it/s][A
Epoch 31:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.241, v_num=1, train_loss=0.172, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.481, val_accuracy=0.878, val_f1_scor

Epoch 31, global step 7231: val_loss was not in top 2


Epoch 32:  89%|████████▊ | 226/255 [02:31<00:19,  1.49it/s, loss=0.232, v_num=1, train_loss=0.188, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.492, val_accuracy=0.850, val_f1_score=0.850] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 32:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.232, v_num=1, train_loss=0.188, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.492, val_accuracy=0.850, val_f1_score=0.850]
Validating:   7%|▋         | 2/29 [00:06<01:10,  2.62s/it][A
Epoch 32:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.232, v_num=1, train_loss=0.188, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.492, val_accuracy=0.850, val_f1_score=0.850]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.01it/s][A
Epoch 32:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.232, v_num=1, train_loss=0.188, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.492, val_accuracy=0.850, val_f1_scor

Epoch 32, global step 7457: val_loss reached 0.37787 (best 0.36690), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v3.ckpt" as top 2


Epoch 33:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.271, v_num=1, train_loss=0.301, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.378, val_accuracy=0.853, val_f1_score=0.853] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 33:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.271, v_num=1, train_loss=0.301, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.378, val_accuracy=0.853, val_f1_score=0.853]
Validating:   7%|▋         | 2/29 [00:06<01:09,  2.57s/it][A
Epoch 33:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.271, v_num=1, train_loss=0.301, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.378, val_accuracy=0.853, val_f1_score=0.853]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.01it/s][A
Epoch 33:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.271, v_num=1, train_loss=0.301, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.378, val_accuracy=0.853, val_f1_scor

Epoch 33, global step 7683: val_loss reached 0.37093 (best 0.36690), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v3.ckpt" as top 2


Epoch 34:  89%|████████▊ | 226/255 [02:33<00:19,  1.47it/s, loss=0.185, v_num=1, train_loss=0.223, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.371, val_accuracy=0.852, val_f1_score=0.852] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 34:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.185, v_num=1, train_loss=0.223, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.371, val_accuracy=0.852, val_f1_score=0.852]
Epoch 34:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.185, v_num=1, train_loss=0.223, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.371, val_accuracy=0.852, val_f1_score=0.852]
Epoch 34:  91%|█████████ | 232/255 [02:39<00:15,  1.45it/s, loss=0.185, v_num=1, train_loss=0.223, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.371, val_accuracy=0.852, val_f1_score=0.852]
Epoch 34:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.185, v_num=1, train_loss=0.223, train_accuracy=0

Epoch 34, global step 7909: val_loss was not in top 2


Epoch 35:  89%|████████▊ | 226/255 [02:31<00:19,  1.49it/s, loss=0.205, v_num=1, train_loss=0.281, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.391, val_accuracy=0.874, val_f1_score=0.874] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 35:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.205, v_num=1, train_loss=0.281, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.391, val_accuracy=0.874, val_f1_score=0.874]
Validating:   7%|▋         | 2/29 [00:06<01:09,  2.59s/it][A
Epoch 35:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.205, v_num=1, train_loss=0.281, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.391, val_accuracy=0.874, val_f1_score=0.874]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.03it/s][A
Epoch 35:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.205, v_num=1, train_loss=0.281, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.391, val_accuracy=0.874, val_f1_scor

Epoch 35, global step 8135: val_loss was not in top 2


Epoch 36:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.208, v_num=1, train_loss=0.401, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.593, val_accuracy=0.847, val_f1_score=0.847] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 36:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.208, v_num=1, train_loss=0.401, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.593, val_accuracy=0.847, val_f1_score=0.847]
Validating:   7%|▋         | 2/29 [00:06<01:10,  2.60s/it][A
Epoch 36:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.208, v_num=1, train_loss=0.401, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.593, val_accuracy=0.847, val_f1_score=0.847]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.00it/s][A
Epoch 36:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.208, v_num=1, train_loss=0.401, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.593, val_accuracy=0.847, val_f1_scor

Epoch 36, global step 8361: val_loss was not in top 2


Epoch 37:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.195, v_num=1, train_loss=0.393, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.459, val_accuracy=0.874, val_f1_score=0.874] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 37:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.195, v_num=1, train_loss=0.393, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.459, val_accuracy=0.874, val_f1_score=0.874]
Validating:   7%|▋         | 2/29 [00:06<01:10,  2.61s/it][A
Epoch 37:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.195, v_num=1, train_loss=0.393, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.459, val_accuracy=0.874, val_f1_score=0.874]
Validating:  14%|█▍        | 4/29 [00:06<00:23,  1.04it/s][A
Epoch 37:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.195, v_num=1, train_loss=0.393, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.459, val_accuracy=0.874, val_f1_scor

Epoch 37, global step 8587: val_loss was not in top 2


Epoch 38:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.114, v_num=1, train_loss=0.132, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.539, val_accuracy=0.836, val_f1_score=0.836] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 38:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.114, v_num=1, train_loss=0.132, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.539, val_accuracy=0.836, val_f1_score=0.836]
Validating:   7%|▋         | 2/29 [00:06<01:10,  2.61s/it][A
Epoch 38:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.114, v_num=1, train_loss=0.132, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.539, val_accuracy=0.836, val_f1_score=0.836]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.00it/s][A
Epoch 38:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.114, v_num=1, train_loss=0.132, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.539, val_accuracy=0.836, val_f1_scor

Epoch 38, global step 8813: val_loss was not in top 2


Epoch 39:  89%|████████▊ | 226/255 [02:31<00:19,  1.50it/s, loss=0.179, v_num=1, train_loss=0.305, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.422, val_accuracy=0.886, val_f1_score=0.886] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 39:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.179, v_num=1, train_loss=0.305, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.422, val_accuracy=0.886, val_f1_score=0.886]
Validating:   7%|▋         | 2/29 [00:06<01:12,  2.67s/it][A
Epoch 39:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.179, v_num=1, train_loss=0.305, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.422, val_accuracy=0.886, val_f1_score=0.886]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.02it/s][A
Epoch 39:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.179, v_num=1, train_loss=0.305, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.422, val_accuracy=0.886, val_f1_scor

Epoch 39, global step 9039: val_loss was not in top 2


Epoch 40:  89%|████████▊ | 226/255 [02:31<00:19,  1.49it/s, loss=0.14, v_num=1, train_loss=0.102, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.405, val_accuracy=0.871, val_f1_score=0.871]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 40:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.14, v_num=1, train_loss=0.102, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.405, val_accuracy=0.871, val_f1_score=0.871]
Validating:   7%|▋         | 2/29 [00:06<01:10,  2.61s/it][A
Epoch 40:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.14, v_num=1, train_loss=0.102, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.405, val_accuracy=0.871, val_f1_score=0.871]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.04it/s][A
Epoch 40:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.14, v_num=1, train_loss=0.102, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.405, val_accuracy=0.871, val_f1_score=0

Epoch 40, global step 9265: val_loss was not in top 2


Epoch 41:  89%|████████▊ | 226/255 [02:31<00:19,  1.49it/s, loss=0.116, v_num=1, train_loss=0.0554, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.420, val_accuracy=0.881, val_f1_score=0.881]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 41:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.116, v_num=1, train_loss=0.0554, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.420, val_accuracy=0.881, val_f1_score=0.881]
Validating:   7%|▋         | 2/29 [00:06<01:09,  2.58s/it][A
Epoch 41:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.116, v_num=1, train_loss=0.0554, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.420, val_accuracy=0.881, val_f1_score=0.881]
Validating:  14%|█▍        | 4/29 [00:06<00:23,  1.06it/s][A
Epoch 41:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.116, v_num=1, train_loss=0.0554, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.420, val_accuracy=0.881, val_f1_s

Epoch 41, global step 9491: val_loss was not in top 2


Epoch 42:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.16, v_num=1, train_loss=0.247, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.382, val_accuracy=0.897, val_f1_score=0.897]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 42:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.16, v_num=1, train_loss=0.247, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.382, val_accuracy=0.897, val_f1_score=0.897]
Validating:   7%|▋         | 2/29 [00:06<01:09,  2.59s/it][A
Epoch 42:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.16, v_num=1, train_loss=0.247, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.382, val_accuracy=0.897, val_f1_score=0.897]
Validating:  14%|█▍        | 4/29 [00:06<00:23,  1.05it/s][A
Epoch 42:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.16, v_num=1, train_loss=0.247, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.382, val_accuracy=0.897, val_f1_score=0

Epoch 42, global step 9717: val_loss was not in top 2


Epoch 43:  89%|████████▊ | 226/255 [02:34<00:19,  1.47it/s, loss=0.158, v_num=1, train_loss=0.0825, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.401, val_accuracy=0.882, val_f1_score=0.882]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 43:  89%|████████▉ | 228/255 [02:40<00:18,  1.42it/s, loss=0.158, v_num=1, train_loss=0.0825, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.401, val_accuracy=0.882, val_f1_score=0.882]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.64s/it][A
Epoch 43:  90%|█████████ | 230/255 [02:40<00:17,  1.43it/s, loss=0.158, v_num=1, train_loss=0.0825, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.401, val_accuracy=0.882, val_f1_score=0.882]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.03it/s][A
Epoch 43:  91%|█████████ | 232/255 [02:41<00:15,  1.44it/s, loss=0.158, v_num=1, train_loss=0.0825, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.401, val_accuracy=0.882, val_f1_s

Epoch 43, global step 9943: val_loss was not in top 2


Epoch 44:  89%|████████▊ | 226/255 [02:31<00:19,  1.50it/s, loss=0.0992, v_num=1, train_loss=0.0109, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.509, val_accuracy=0.877, val_f1_score=0.877]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 44:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.0992, v_num=1, train_loss=0.0109, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.509, val_accuracy=0.877, val_f1_score=0.877]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.65s/it][A
Epoch 44:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0992, v_num=1, train_loss=0.0109, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.509, val_accuracy=0.877, val_f1_score=0.877]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.01s/it][A
Epoch 44:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0992, v_num=1, train_loss=0.0109, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.509, val_accuracy=0.877, val_

Epoch 44, global step 10169: val_loss was not in top 2


Epoch 45:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.307, v_num=1, train_loss=0.457, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.424, val_accuracy=0.894, val_f1_score=0.894]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 45:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.307, v_num=1, train_loss=0.457, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.424, val_accuracy=0.894, val_f1_score=0.894]
Validating:   7%|▋         | 2/29 [00:06<01:10,  2.62s/it][A
Epoch 45:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.307, v_num=1, train_loss=0.457, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.424, val_accuracy=0.894, val_f1_score=0.894]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.00it/s][A
Epoch 45:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.307, v_num=1, train_loss=0.457, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.424, val_accuracy=0.894, val_f1_sco

Epoch 45, global step 10395: val_loss was not in top 2


Epoch 46:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.19, v_num=1, train_loss=0.546, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.414, val_accuracy=0.851, val_f1_score=0.851]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 46:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.19, v_num=1, train_loss=0.546, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.414, val_accuracy=0.851, val_f1_score=0.851]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.64s/it][A
Epoch 46:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.19, v_num=1, train_loss=0.546, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.414, val_accuracy=0.851, val_f1_score=0.851]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.01s/it][A
Epoch 46:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.19, v_num=1, train_loss=0.546, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.414, val_accuracy=0.851, val_f1_score=0

Epoch 46, global step 10621: val_loss was not in top 2


Epoch 47:  89%|████████▊ | 226/255 [02:31<00:19,  1.50it/s, loss=0.109, v_num=1, train_loss=0.0865, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.448, val_accuracy=0.858, val_f1_score=0.858] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 47:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.109, v_num=1, train_loss=0.0865, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.448, val_accuracy=0.858, val_f1_score=0.858]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.65s/it][A
Epoch 47:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.109, v_num=1, train_loss=0.0865, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.448, val_accuracy=0.858, val_f1_score=0.858]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.01it/s][A
Epoch 47:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.109, v_num=1, train_loss=0.0865, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.448, val_accuracy=0.858, val_f1_

Epoch 47, global step 10847: val_loss was not in top 2


Epoch 48:  89%|████████▊ | 226/255 [02:31<00:19,  1.49it/s, loss=0.15, v_num=1, train_loss=0.197, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.411, val_accuracy=0.891, val_f1_score=0.891]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 48:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.15, v_num=1, train_loss=0.197, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.411, val_accuracy=0.891, val_f1_score=0.891]
Validating:   7%|▋         | 2/29 [00:06<01:09,  2.59s/it][A
Epoch 48:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.15, v_num=1, train_loss=0.197, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.411, val_accuracy=0.891, val_f1_score=0.891]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.01it/s][A
Epoch 48:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.15, v_num=1, train_loss=0.197, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.411, val_accuracy=0.891, val_f1_score=0

Epoch 48, global step 11073: val_loss reached 0.31910 (best 0.31910), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v3.ckpt" as top 2


Epoch 49:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.138, v_num=1, train_loss=0.0732, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.319, val_accuracy=0.896, val_f1_score=0.896]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 49:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.138, v_num=1, train_loss=0.0732, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.319, val_accuracy=0.896, val_f1_score=0.896]
Validating:   7%|▋         | 2/29 [00:06<01:09,  2.56s/it][A
Epoch 49:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.138, v_num=1, train_loss=0.0732, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.319, val_accuracy=0.896, val_f1_score=0.896]
Validating:  14%|█▍        | 4/29 [00:06<00:23,  1.06it/s][A
Epoch 49:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.138, v_num=1, train_loss=0.0732, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.319, val_accuracy=0.896, val_f1_s

Epoch 49, global step 11299: val_loss reached 0.31322 (best 0.31322), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v2.ckpt" as top 2


Epoch 50:  89%|████████▊ | 226/255 [02:31<00:19,  1.50it/s, loss=0.103, v_num=1, train_loss=0.100, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.313, val_accuracy=0.894, val_f1_score=0.894]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 50:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.103, v_num=1, train_loss=0.100, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.313, val_accuracy=0.894, val_f1_score=0.894]
Validating:   7%|▋         | 2/29 [00:06<01:10,  2.60s/it][A
Epoch 50:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.103, v_num=1, train_loss=0.100, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.313, val_accuracy=0.894, val_f1_score=0.894]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.01it/s][A
Epoch 50:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.103, v_num=1, train_loss=0.100, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.313, val_accuracy=0.894, val_f1_sco

Epoch 50, global step 11525: val_loss was not in top 2


Epoch 51:  89%|████████▊ | 226/255 [02:34<00:19,  1.47it/s, loss=0.126, v_num=1, train_loss=0.0657, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.379, val_accuracy=0.892, val_f1_score=0.892] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 51:  89%|████████▉ | 228/255 [02:40<00:18,  1.42it/s, loss=0.126, v_num=1, train_loss=0.0657, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.379, val_accuracy=0.892, val_f1_score=0.892]
Epoch 51:  90%|█████████ | 230/255 [02:40<00:17,  1.43it/s, loss=0.126, v_num=1, train_loss=0.0657, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.379, val_accuracy=0.892, val_f1_score=0.892]
Epoch 51:  91%|█████████ | 232/255 [02:40<00:15,  1.44it/s, loss=0.126, v_num=1, train_loss=0.0657, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.379, val_accuracy=0.892, val_f1_score=0.892]
Epoch 51:  92%|█████████▏| 234/255 [02:40<00:14,  1.46it/s, loss=0.126, v_num=1, train_loss=0.0657, train_accur

Epoch 51, global step 11751: val_loss was not in top 2


Epoch 52:  89%|████████▊ | 226/255 [02:31<00:19,  1.49it/s, loss=0.118, v_num=1, train_loss=0.232, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.341, val_accuracy=0.903, val_f1_score=0.903]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 52:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.118, v_num=1, train_loss=0.232, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.341, val_accuracy=0.903, val_f1_score=0.903]
Validating:   7%|▋         | 2/29 [00:06<01:10,  2.59s/it][A
Epoch 52:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.118, v_num=1, train_loss=0.232, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.341, val_accuracy=0.903, val_f1_score=0.903]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.00it/s][A
Epoch 52:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.118, v_num=1, train_loss=0.232, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.341, val_accuracy=0.903, val_f1_sco

Epoch 52, global step 11977: val_loss was not in top 2


Epoch 53:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.0938, v_num=1, train_loss=0.0207, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.450, val_accuracy=0.886, val_f1_score=0.886]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 53:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.0938, v_num=1, train_loss=0.0207, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.450, val_accuracy=0.886, val_f1_score=0.886]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.66s/it][A
Epoch 53:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0938, v_num=1, train_loss=0.0207, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.450, val_accuracy=0.886, val_f1_score=0.886]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.02it/s][A
Epoch 53:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0938, v_num=1, train_loss=0.0207, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.450, val_accuracy=0.886, val_

Epoch 53, global step 12203: val_loss was not in top 2


Epoch 54:  89%|████████▊ | 226/255 [02:31<00:19,  1.49it/s, loss=0.101, v_num=1, train_loss=0.0196, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.430, val_accuracy=0.891, val_f1_score=0.891]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 54:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.101, v_num=1, train_loss=0.0196, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.430, val_accuracy=0.891, val_f1_score=0.891]
Validating:   7%|▋         | 2/29 [00:06<01:10,  2.62s/it][A
Epoch 54:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.101, v_num=1, train_loss=0.0196, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.430, val_accuracy=0.891, val_f1_score=0.891]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.03it/s][A
Epoch 54:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.101, v_num=1, train_loss=0.0196, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.430, val_accuracy=0.891, val_f1

Epoch 54, global step 12429: val_loss was not in top 2


Epoch 55:  89%|████████▊ | 226/255 [02:31<00:19,  1.50it/s, loss=0.0957, v_num=1, train_loss=0.0827, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.425, val_accuracy=0.888, val_f1_score=0.888] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 55:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.0957, v_num=1, train_loss=0.0827, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.425, val_accuracy=0.888, val_f1_score=0.888]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.65s/it][A
Epoch 55:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0957, v_num=1, train_loss=0.0827, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.425, val_accuracy=0.888, val_f1_score=0.888]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.03it/s][A
Epoch 55:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0957, v_num=1, train_loss=0.0827, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.425, val_accuracy=0.888, val

Epoch 55, global step 12655: val_loss was not in top 2


Epoch 56:  89%|████████▊ | 226/255 [02:31<00:19,  1.49it/s, loss=0.163, v_num=1, train_loss=0.238, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.425, val_accuracy=0.896, val_f1_score=0.896]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 56:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.163, v_num=1, train_loss=0.238, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.425, val_accuracy=0.896, val_f1_score=0.896]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.66s/it][A
Epoch 56:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.163, v_num=1, train_loss=0.238, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.425, val_accuracy=0.896, val_f1_score=0.896]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.02s/it][A
Epoch 56:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.163, v_num=1, train_loss=0.238, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.425, val_accuracy=0.896, val_f1_sco

Epoch 56, global step 12881: val_loss was not in top 2


Epoch 57:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.11, v_num=1, train_loss=0.0268, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.392, val_accuracy=0.874, val_f1_score=0.874]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 57:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.11, v_num=1, train_loss=0.0268, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.392, val_accuracy=0.874, val_f1_score=0.874]
Validating:   7%|▋         | 2/29 [00:06<01:12,  2.67s/it][A
Epoch 57:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.11, v_num=1, train_loss=0.0268, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.392, val_accuracy=0.874, val_f1_score=0.874]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.01it/s][A
Epoch 57:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.11, v_num=1, train_loss=0.0268, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.392, val_accuracy=0.874, val_f1_sco

Epoch 57, global step 13107: val_loss was not in top 2


Epoch 58:  89%|████████▊ | 226/255 [02:31<00:19,  1.49it/s, loss=0.106, v_num=1, train_loss=0.0799, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.503, val_accuracy=0.868, val_f1_score=0.868] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 58:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.106, v_num=1, train_loss=0.0799, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.503, val_accuracy=0.868, val_f1_score=0.868]
Validating:   7%|▋         | 2/29 [00:06<01:10,  2.61s/it][A
Epoch 58:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.106, v_num=1, train_loss=0.0799, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.503, val_accuracy=0.868, val_f1_score=0.868]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.00s/it][A
Epoch 58:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.106, v_num=1, train_loss=0.0799, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.503, val_accuracy=0.868, val_f1_

Epoch 58, global step 13333: val_loss was not in top 2


Epoch 59:  89%|████████▊ | 226/255 [02:33<00:19,  1.48it/s, loss=0.111, v_num=1, train_loss=0.280, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.440, val_accuracy=0.878, val_f1_score=0.878]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 59:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.111, v_num=1, train_loss=0.280, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.440, val_accuracy=0.878, val_f1_score=0.878]
Validating:   7%|▋         | 2/29 [00:06<01:10,  2.62s/it][A
Epoch 59:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.111, v_num=1, train_loss=0.280, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.440, val_accuracy=0.878, val_f1_score=0.878]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.03it/s][A
Epoch 59:  91%|█████████ | 232/255 [02:39<00:15,  1.45it/s, loss=0.111, v_num=1, train_loss=0.280, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.440, val_accuracy=0.878, val_f1_sco

Epoch 59, global step 13559: val_loss was not in top 2


Epoch 60:  89%|████████▊ | 226/255 [02:32<00:19,  1.48it/s, loss=0.108, v_num=1, train_loss=0.158, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.442, val_accuracy=0.883, val_f1_score=0.883]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 60:  89%|████████▉ | 228/255 [02:38<00:18,  1.44it/s, loss=0.108, v_num=1, train_loss=0.158, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.442, val_accuracy=0.883, val_f1_score=0.883]
Validating:   7%|▋         | 2/29 [00:06<01:13,  2.74s/it][A
Epoch 60:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.108, v_num=1, train_loss=0.158, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.442, val_accuracy=0.883, val_f1_score=0.883]
Validating:  14%|█▍        | 4/29 [00:06<00:26,  1.05s/it][A
Epoch 60:  91%|█████████ | 232/255 [02:39<00:15,  1.45it/s, loss=0.108, v_num=1, train_loss=0.158, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.442, val_accuracy=0.883, val_f1_sco

Epoch 60, global step 13785: val_loss was not in top 2


Epoch 61:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.135, v_num=1, train_loss=0.0427, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.512, val_accuracy=0.864, val_f1_score=0.864] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 61:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.135, v_num=1, train_loss=0.0427, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.512, val_accuracy=0.864, val_f1_score=0.864]
Validating:   7%|▋         | 2/29 [00:06<01:12,  2.70s/it][A
Epoch 61:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.135, v_num=1, train_loss=0.0427, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.512, val_accuracy=0.864, val_f1_score=0.864]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.03s/it][A
Epoch 61:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.135, v_num=1, train_loss=0.0427, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.512, val_accuracy=0.864, val_f1_

Epoch 61, global step 14011: val_loss was not in top 2


Epoch 62:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.0996, v_num=1, train_loss=0.0548, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.390, val_accuracy=0.881, val_f1_score=0.881]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 62:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.0996, v_num=1, train_loss=0.0548, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.390, val_accuracy=0.881, val_f1_score=0.881]
Validating:   7%|▋         | 2/29 [00:06<01:13,  2.71s/it][A
Epoch 62:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0996, v_num=1, train_loss=0.0548, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.390, val_accuracy=0.881, val_f1_score=0.881]
Epoch 62:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0996, v_num=1, train_loss=0.0548, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.390, val_accuracy=0.881, val_f1_score=0.881]
Validating:  21%|██        | 6/29 [00:07<00:14

Epoch 62, global step 14237: val_loss was not in top 2


Epoch 63:  89%|████████▊ | 226/255 [02:31<00:19,  1.50it/s, loss=0.131, v_num=1, train_loss=0.0607, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.472, val_accuracy=0.869, val_f1_score=0.869] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 63:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.131, v_num=1, train_loss=0.0607, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.472, val_accuracy=0.869, val_f1_score=0.869]
Validating:   7%|▋         | 2/29 [00:06<01:09,  2.58s/it][A
Epoch 63:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.131, v_num=1, train_loss=0.0607, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.472, val_accuracy=0.869, val_f1_score=0.869]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.01it/s][A
Epoch 63:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.131, v_num=1, train_loss=0.0607, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.472, val_accuracy=0.869, val_f1_

Epoch 63, global step 14463: val_loss was not in top 2


Epoch 64:  89%|████████▊ | 226/255 [02:30<00:19,  1.51it/s, loss=0.107, v_num=1, train_loss=0.104, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.401, val_accuracy=0.867, val_f1_score=0.867]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 64:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.107, v_num=1, train_loss=0.104, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.401, val_accuracy=0.867, val_f1_score=0.867]
Validating:   7%|▋         | 2/29 [00:06<01:13,  2.72s/it][A
Epoch 64:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.107, v_num=1, train_loss=0.104, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.401, val_accuracy=0.867, val_f1_score=0.867]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.01it/s][A
Epoch 64:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.107, v_num=1, train_loss=0.104, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.401, val_accuracy=0.867, val_f1_sco

Epoch 64, global step 14689: val_loss was not in top 2


Epoch 65:  89%|████████▊ | 226/255 [02:31<00:19,  1.50it/s, loss=0.0857, v_num=1, train_loss=0.0139, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.355, val_accuracy=0.888, val_f1_score=0.888]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 65:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.0857, v_num=1, train_loss=0.0139, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.355, val_accuracy=0.888, val_f1_score=0.888]
Validating:   7%|▋         | 2/29 [00:06<01:12,  2.67s/it][A
Epoch 65:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0857, v_num=1, train_loss=0.0139, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.355, val_accuracy=0.888, val_f1_score=0.888]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.02it/s][A
Epoch 65:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0857, v_num=1, train_loss=0.0139, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.355, val_accuracy=0.888, val_

Epoch 65, global step 14915: val_loss was not in top 2


Epoch 66:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.0701, v_num=1, train_loss=0.242, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.356, val_accuracy=0.894, val_f1_score=0.894]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 66:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.0701, v_num=1, train_loss=0.242, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.356, val_accuracy=0.894, val_f1_score=0.894]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.67s/it][A
Epoch 66:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0701, v_num=1, train_loss=0.242, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.356, val_accuracy=0.894, val_f1_score=0.894]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.02s/it][A
Epoch 66:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0701, v_num=1, train_loss=0.242, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.356, val_accuracy=0.894, val_f1

Epoch 66, global step 15141: val_loss was not in top 2


Epoch 67:  89%|████████▊ | 226/255 [02:31<00:19,  1.50it/s, loss=0.0599, v_num=1, train_loss=0.0457, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.460, val_accuracy=0.888, val_f1_score=0.888]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 67:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.0599, v_num=1, train_loss=0.0457, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.460, val_accuracy=0.888, val_f1_score=0.888]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.65s/it][A
Epoch 67:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0599, v_num=1, train_loss=0.0457, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.460, val_accuracy=0.888, val_f1_score=0.888]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.03it/s][A
Epoch 67:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0599, v_num=1, train_loss=0.0457, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.460, val_accuracy=0.888, val_

Epoch 67, global step 15367: val_loss was not in top 2


Epoch 68:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0794, v_num=1, train_loss=0.018, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.394, val_accuracy=0.896, val_f1_score=0.896]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 68:  89%|████████▉ | 228/255 [02:40<00:19,  1.42it/s, loss=0.0794, v_num=1, train_loss=0.018, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.394, val_accuracy=0.896, val_f1_score=0.896]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.65s/it][A
Epoch 68:  90%|█████████ | 230/255 [02:40<00:17,  1.43it/s, loss=0.0794, v_num=1, train_loss=0.018, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.394, val_accuracy=0.896, val_f1_score=0.896]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.01s/it][A
Epoch 68:  91%|█████████ | 232/255 [02:41<00:15,  1.44it/s, loss=0.0794, v_num=1, train_loss=0.018, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.394, val_accuracy=0.896, val_f1

Epoch 68, global step 15593: val_loss was not in top 2


Epoch 69:  89%|████████▊ | 226/255 [02:31<00:19,  1.49it/s, loss=0.0762, v_num=1, train_loss=0.114, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.693, val_accuracy=0.855, val_f1_score=0.855]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 69:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.0762, v_num=1, train_loss=0.114, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.693, val_accuracy=0.855, val_f1_score=0.855]
Validating:   7%|▋         | 2/29 [00:06<01:12,  2.67s/it][A
Epoch 69:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.0762, v_num=1, train_loss=0.114, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.693, val_accuracy=0.855, val_f1_score=0.855]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.02it/s][A
Epoch 69:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.0762, v_num=1, train_loss=0.114, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.693, val_accuracy=0.855, val_f1

Epoch 69, global step 15819: val_loss was not in top 2


Epoch 70:  89%|████████▊ | 226/255 [02:31<00:19,  1.49it/s, loss=0.0516, v_num=1, train_loss=0.0525, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.435, val_accuracy=0.884, val_f1_score=0.884] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 70:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.0516, v_num=1, train_loss=0.0525, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.435, val_accuracy=0.884, val_f1_score=0.884]
Validating:   7%|▋         | 2/29 [00:06<01:12,  2.67s/it][A
Epoch 70:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.0516, v_num=1, train_loss=0.0525, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.435, val_accuracy=0.884, val_f1_score=0.884]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.02it/s][A
Epoch 70:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.0516, v_num=1, train_loss=0.0525, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.435, val_accuracy=0.884, val

Epoch 70, global step 16045: val_loss was not in top 2


Epoch 71:  89%|████████▊ | 226/255 [02:31<00:19,  1.49it/s, loss=0.0592, v_num=1, train_loss=0.0136, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.384, val_accuracy=0.908, val_f1_score=0.908] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 71:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.0592, v_num=1, train_loss=0.0136, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.384, val_accuracy=0.908, val_f1_score=0.908]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.67s/it][A
Epoch 71:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0592, v_num=1, train_loss=0.0136, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.384, val_accuracy=0.908, val_f1_score=0.908]
Epoch 71:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.0592, v_num=1, train_loss=0.0136, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.384, val_accuracy=0.908, val_f1_score=0.908]
Validating:  21%|██        | 6/29 [00:07<00:1

Epoch 71, global step 16271: val_loss was not in top 2


Epoch 72:  89%|████████▊ | 226/255 [02:31<00:19,  1.50it/s, loss=0.0647, v_num=1, train_loss=0.0796, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.359, val_accuracy=0.909, val_f1_score=0.909] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 72:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.0647, v_num=1, train_loss=0.0796, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.359, val_accuracy=0.909, val_f1_score=0.909]
Validating:   7%|▋         | 2/29 [00:06<01:09,  2.59s/it][A
Epoch 72:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0647, v_num=1, train_loss=0.0796, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.359, val_accuracy=0.909, val_f1_score=0.909]
Validating:  14%|█▍        | 4/29 [00:06<00:23,  1.05it/s][A
Epoch 72:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0647, v_num=1, train_loss=0.0796, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.359, val_accuracy=0.909, val

Epoch 72, global step 16497: val_loss was not in top 2


Epoch 73:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.0577, v_num=1, train_loss=0.0257, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.444, val_accuracy=0.896, val_f1_score=0.896] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 73:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.0577, v_num=1, train_loss=0.0257, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.444, val_accuracy=0.896, val_f1_score=0.896]
Validating:   7%|▋         | 2/29 [00:06<01:13,  2.71s/it][A
Epoch 73:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0577, v_num=1, train_loss=0.0257, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.444, val_accuracy=0.896, val_f1_score=0.896]
Epoch 73:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0577, v_num=1, train_loss=0.0257, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.444, val_accuracy=0.896, val_f1_score=0.896]
Validating:  21%|██        | 6/29 [00:07<00:1

Epoch 73, global step 16723: val_loss was not in top 2


Epoch 74:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.0507, v_num=1, train_loss=0.0134, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.467, val_accuracy=0.888, val_f1_score=0.888] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 74:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.0507, v_num=1, train_loss=0.0134, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.467, val_accuracy=0.888, val_f1_score=0.888]
Validating:   7%|▋         | 2/29 [00:06<01:13,  2.71s/it][A
Epoch 74:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0507, v_num=1, train_loss=0.0134, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.467, val_accuracy=0.888, val_f1_score=0.888]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.00it/s][A
Epoch 74:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0507, v_num=1, train_loss=0.0134, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.467, val_accuracy=0.888, val

Epoch 74, global step 16949: val_loss was not in top 2


Epoch 75:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.0793, v_num=1, train_loss=0.0169, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.516, val_accuracy=0.886, val_f1_score=0.886] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 75:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.0793, v_num=1, train_loss=0.0169, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.516, val_accuracy=0.886, val_f1_score=0.886]
Validating:   7%|▋         | 2/29 [00:06<01:12,  2.68s/it][A
Epoch 75:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0793, v_num=1, train_loss=0.0169, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.516, val_accuracy=0.886, val_f1_score=0.886]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.02it/s][A
Epoch 75:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0793, v_num=1, train_loss=0.0169, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.516, val_accuracy=0.886, val

Epoch 75, global step 17175: val_loss was not in top 2


Epoch 76:  89%|████████▊ | 226/255 [02:35<00:19,  1.45it/s, loss=0.0524, v_num=1, train_loss=0.0226, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.448, val_accuracy=0.890, val_f1_score=0.890] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 76:  89%|████████▉ | 228/255 [02:41<00:19,  1.41it/s, loss=0.0524, v_num=1, train_loss=0.0226, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.448, val_accuracy=0.890, val_f1_score=0.890]
Validating:   7%|▋         | 2/29 [00:06<01:14,  2.75s/it][A
Epoch 76:  90%|█████████ | 230/255 [02:42<00:17,  1.42it/s, loss=0.0524, v_num=1, train_loss=0.0226, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.448, val_accuracy=0.890, val_f1_score=0.890]
Validating:  14%|█▍        | 4/29 [00:07<00:26,  1.05s/it][A
Epoch 76:  91%|█████████ | 232/255 [02:42<00:16,  1.43it/s, loss=0.0524, v_num=1, train_loss=0.0226, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.448, val_accuracy=0.890, val

Epoch 76, global step 17401: val_loss was not in top 2


Epoch 77:  89%|████████▊ | 226/255 [02:31<00:19,  1.49it/s, loss=0.18, v_num=1, train_loss=0.0769, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.373, val_accuracy=0.904, val_f1_score=0.904]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 77:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.18, v_num=1, train_loss=0.0769, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.373, val_accuracy=0.904, val_f1_score=0.904]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.66s/it][A
Epoch 77:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.18, v_num=1, train_loss=0.0769, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.373, val_accuracy=0.904, val_f1_score=0.904]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.02s/it][A
Epoch 77:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.18, v_num=1, train_loss=0.0769, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.373, val_accuracy=0.904, val_f1_sc

Epoch 77, global step 17627: val_loss was not in top 2


Epoch 78:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.101, v_num=1, train_loss=0.0311, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.374, val_accuracy=0.862, val_f1_score=0.862]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 78:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.101, v_num=1, train_loss=0.0311, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.374, val_accuracy=0.862, val_f1_score=0.862]
Validating:   7%|▋         | 2/29 [00:06<01:12,  2.68s/it][A
Epoch 78:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.101, v_num=1, train_loss=0.0311, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.374, val_accuracy=0.862, val_f1_score=0.862]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.03s/it][A
Epoch 78:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.101, v_num=1, train_loss=0.0311, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.374, val_accuracy=0.862, val_f1_s

Epoch 78, global step 17853: val_loss was not in top 2


Epoch 79:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.0656, v_num=1, train_loss=0.0517, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.378, val_accuracy=0.883, val_f1_score=0.883]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 79:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.0656, v_num=1, train_loss=0.0517, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.378, val_accuracy=0.883, val_f1_score=0.883]
Validating:   7%|▋         | 2/29 [00:06<01:12,  2.67s/it][A
Epoch 79:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0656, v_num=1, train_loss=0.0517, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.378, val_accuracy=0.883, val_f1_score=0.883]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.03s/it][A
Epoch 79:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0656, v_num=1, train_loss=0.0517, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.378, val_accuracy=0.883, val_

Epoch 79, global step 18079: val_loss was not in top 2


Epoch 80:  89%|████████▊ | 226/255 [02:31<00:19,  1.49it/s, loss=0.103, v_num=1, train_loss=0.0918, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.402, val_accuracy=0.899, val_f1_score=0.899] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 80:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.103, v_num=1, train_loss=0.0918, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.402, val_accuracy=0.899, val_f1_score=0.899]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.66s/it][A
Epoch 80:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.103, v_num=1, train_loss=0.0918, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.402, val_accuracy=0.899, val_f1_score=0.899]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.02it/s][A
Epoch 80:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.103, v_num=1, train_loss=0.0918, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.402, val_accuracy=0.899, val_f1_

Epoch 80, global step 18305: val_loss was not in top 2


Epoch 81:  89%|████████▊ | 226/255 [02:31<00:19,  1.49it/s, loss=0.0614, v_num=1, train_loss=0.0178, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.347, val_accuracy=0.899, val_f1_score=0.899]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 81:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.0614, v_num=1, train_loss=0.0178, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.347, val_accuracy=0.899, val_f1_score=0.899]
Validating:   7%|▋         | 2/29 [00:06<01:12,  2.67s/it][A
Epoch 81:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.0614, v_num=1, train_loss=0.0178, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.347, val_accuracy=0.899, val_f1_score=0.899]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.02it/s][A
Epoch 81:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.0614, v_num=1, train_loss=0.0178, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.347, val_accuracy=0.899, val_

Epoch 81, global step 18531: val_loss was not in top 2


Epoch 82:  89%|████████▊ | 226/255 [02:31<00:19,  1.49it/s, loss=0.055, v_num=1, train_loss=0.0319, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.346, val_accuracy=0.901, val_f1_score=0.901]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 82:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.055, v_num=1, train_loss=0.0319, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.346, val_accuracy=0.901, val_f1_score=0.901]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.65s/it][A
Epoch 82:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.055, v_num=1, train_loss=0.0319, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.346, val_accuracy=0.901, val_f1_score=0.901]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.00it/s][A
Epoch 82:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.055, v_num=1, train_loss=0.0319, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.346, val_accuracy=0.901, val_f1

Epoch 82, global step 18757: val_loss was not in top 2


Epoch 83:  89%|████████▊ | 226/255 [02:31<00:19,  1.49it/s, loss=0.0724, v_num=1, train_loss=0.377, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.335, val_accuracy=0.916, val_f1_score=0.916]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 83:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.0724, v_num=1, train_loss=0.377, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.335, val_accuracy=0.916, val_f1_score=0.916]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.65s/it][A
Epoch 83:  90%|█████████ | 230/255 [02:38<00:17,  1.46it/s, loss=0.0724, v_num=1, train_loss=0.377, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.335, val_accuracy=0.916, val_f1_score=0.916]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.02s/it][A
Epoch 83:  91%|█████████ | 232/255 [02:38<00:15,  1.47it/s, loss=0.0724, v_num=1, train_loss=0.377, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.335, val_accuracy=0.916, val_f1

Epoch 83, global step 18983: val_loss was not in top 2


Epoch 84:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0527, v_num=1, train_loss=0.0333, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.476, val_accuracy=0.888, val_f1_score=0.888] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 84:  89%|████████▉ | 228/255 [02:41<00:19,  1.41it/s, loss=0.0527, v_num=1, train_loss=0.0333, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.476, val_accuracy=0.888, val_f1_score=0.888]
Validating:   7%|▋         | 2/29 [00:06<01:12,  2.68s/it][A
Epoch 84:  90%|█████████ | 230/255 [02:41<00:17,  1.42it/s, loss=0.0527, v_num=1, train_loss=0.0333, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.476, val_accuracy=0.888, val_f1_score=0.888]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.01s/it][A
Epoch 84:  91%|█████████ | 232/255 [02:41<00:16,  1.43it/s, loss=0.0527, v_num=1, train_loss=0.0333, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.476, val_accuracy=0.888, val

Epoch 84, global step 19209: val_loss was not in top 2


Epoch 85:  89%|████████▊ | 226/255 [02:30<00:19,  1.51it/s, loss=0.0318, v_num=1, train_loss=0.00987, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.368, val_accuracy=0.911, val_f1_score=0.911]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 85:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0318, v_num=1, train_loss=0.00987, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.368, val_accuracy=0.911, val_f1_score=0.911]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.67s/it][A
Epoch 85:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0318, v_num=1, train_loss=0.00987, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.368, val_accuracy=0.911, val_f1_score=0.911]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.02s/it][A
Epoch 85:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0318, v_num=1, train_loss=0.00987, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.368, val_accuracy=0.911, 

Epoch 85, global step 19435: val_loss was not in top 2


Epoch 86:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.096, v_num=1, train_loss=0.0492, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.374, val_accuracy=0.909, val_f1_score=0.909]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 86:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.096, v_num=1, train_loss=0.0492, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.374, val_accuracy=0.909, val_f1_score=0.909]
Validating:   7%|▋         | 2/29 [00:06<01:12,  2.68s/it][A
Epoch 86:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.096, v_num=1, train_loss=0.0492, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.374, val_accuracy=0.909, val_f1_score=0.909]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.02s/it][A
Epoch 86:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.096, v_num=1, train_loss=0.0492, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.374, val_accuracy=0.909, val_f1

Epoch 86, global step 19661: val_loss was not in top 2


Epoch 87:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.0578, v_num=1, train_loss=0.013, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.505, val_accuracy=0.886, val_f1_score=0.886]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 87:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0578, v_num=1, train_loss=0.013, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.505, val_accuracy=0.886, val_f1_score=0.886]
Validating:   7%|▋         | 2/29 [00:06<01:08,  2.54s/it][A
Epoch 87:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0578, v_num=1, train_loss=0.013, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.505, val_accuracy=0.886, val_f1_score=0.886]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.02it/s][A
Epoch 87:  91%|█████████ | 232/255 [02:36<00:15,  1.48it/s, loss=0.0578, v_num=1, train_loss=0.013, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.505, val_accuracy=0.886, val_f1

Epoch 87, global step 19887: val_loss was not in top 2


Epoch 88:  89%|████████▊ | 226/255 [02:30<00:19,  1.51it/s, loss=0.0857, v_num=1, train_loss=0.0297, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.421, val_accuracy=0.899, val_f1_score=0.899] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 88:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0857, v_num=1, train_loss=0.0297, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.421, val_accuracy=0.899, val_f1_score=0.899]
Epoch 88:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0857, v_num=1, train_loss=0.0297, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.421, val_accuracy=0.899, val_f1_score=0.899]
Validating:  14%|█▍        | 4/29 [00:06<00:27,  1.08s/it][A
Epoch 88:  91%|█████████ | 232/255 [02:36<00:15,  1.48it/s, loss=0.0857, v_num=1, train_loss=0.0297, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.421, val_accuracy=0.899, val_f1_score=0.899]
Validating:  21%|██        | 6/29 [00:06<00:1

Epoch 88, global step 20113: val_loss was not in top 2


Epoch 89:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.0431, v_num=1, train_loss=0.121, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.702, val_accuracy=0.858, val_f1_score=0.858]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 89:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0431, v_num=1, train_loss=0.121, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.702, val_accuracy=0.858, val_f1_score=0.858]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.64s/it][A
Epoch 89:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0431, v_num=1, train_loss=0.121, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.702, val_accuracy=0.858, val_f1_score=0.858]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.01s/it][A
Epoch 89:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0431, v_num=1, train_loss=0.121, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.702, val_accuracy=0.858, val_f1

Epoch 89, global step 20339: val_loss was not in top 2


Epoch 90:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.0375, v_num=1, train_loss=0.00959, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.400, val_accuracy=0.897, val_f1_score=0.897]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 90:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.0375, v_num=1, train_loss=0.00959, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.400, val_accuracy=0.897, val_f1_score=0.897]
Validating:   7%|▋         | 2/29 [00:06<01:12,  2.68s/it][A
Epoch 90:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0375, v_num=1, train_loss=0.00959, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.400, val_accuracy=0.897, val_f1_score=0.897]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.02it/s][A
Epoch 90:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0375, v_num=1, train_loss=0.00959, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.400, val_accuracy=0.897, 

Epoch 90, global step 20565: val_loss was not in top 2


Epoch 91:  89%|████████▊ | 226/255 [02:29<00:19,  1.51it/s, loss=0.041, v_num=1, train_loss=0.0408, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.329, val_accuracy=0.916, val_f1_score=0.916]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 91:  89%|████████▉ | 228/255 [02:35<00:18,  1.46it/s, loss=0.041, v_num=1, train_loss=0.0408, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.329, val_accuracy=0.916, val_f1_score=0.916]
Validating:   7%|▋         | 2/29 [00:06<01:12,  2.68s/it][A
Epoch 91:  90%|█████████ | 230/255 [02:36<00:16,  1.47it/s, loss=0.041, v_num=1, train_loss=0.0408, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.329, val_accuracy=0.916, val_f1_score=0.916]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.02s/it][A
Epoch 91:  91%|█████████ | 232/255 [02:36<00:15,  1.48it/s, loss=0.041, v_num=1, train_loss=0.0408, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.329, val_accuracy=0.916, val_f1

Epoch 91, global step 20791: val_loss was not in top 2


Epoch 92:  89%|████████▊ | 226/255 [02:32<00:19,  1.48it/s, loss=0.0503, v_num=1, train_loss=0.0172, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.405, val_accuracy=0.909, val_f1_score=0.909] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 92:  89%|████████▉ | 228/255 [02:38<00:18,  1.43it/s, loss=0.0503, v_num=1, train_loss=0.0172, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.405, val_accuracy=0.909, val_f1_score=0.909]
Epoch 92:  90%|█████████ | 230/255 [02:39<00:17,  1.45it/s, loss=0.0503, v_num=1, train_loss=0.0172, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.405, val_accuracy=0.909, val_f1_score=0.909]
Epoch 92:  91%|█████████ | 232/255 [02:39<00:15,  1.46it/s, loss=0.0503, v_num=1, train_loss=0.0172, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.405, val_accuracy=0.909, val_f1_score=0.909]
Epoch 92:  92%|█████████▏| 234/255 [02:39<00:14,  1.47it/s, loss=0.0503, v_num=1, train_loss=0.0172, train_

Epoch 92, global step 21017: val_loss was not in top 2


Epoch 93:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.0509, v_num=1, train_loss=0.131, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.334, val_accuracy=0.921, val_f1_score=0.921]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 93:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0509, v_num=1, train_loss=0.131, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.334, val_accuracy=0.921, val_f1_score=0.921]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.66s/it][A
Epoch 93:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0509, v_num=1, train_loss=0.131, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.334, val_accuracy=0.921, val_f1_score=0.921]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.01s/it][A
Epoch 93:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0509, v_num=1, train_loss=0.131, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.334, val_accuracy=0.921, val_f1

Epoch 93, global step 21243: val_loss was not in top 2


Epoch 94:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.0381, v_num=1, train_loss=0.0147, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.340, val_accuracy=0.923, val_f1_score=0.923] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 94:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.0381, v_num=1, train_loss=0.0147, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.340, val_accuracy=0.923, val_f1_score=0.923]
Validating:   7%|▋         | 2/29 [00:06<01:13,  2.73s/it][A
Epoch 94:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0381, v_num=1, train_loss=0.0147, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.340, val_accuracy=0.923, val_f1_score=0.923]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.00it/s][A
Epoch 94:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0381, v_num=1, train_loss=0.0147, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.340, val_accuracy=0.923, val

Epoch 94, global step 21469: val_loss was not in top 2


Epoch 95:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.129, v_num=1, train_loss=0.0516, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.387, val_accuracy=0.914, val_f1_score=0.914] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 95:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.129, v_num=1, train_loss=0.0516, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.387, val_accuracy=0.914, val_f1_score=0.914]
Epoch 95:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.129, v_num=1, train_loss=0.0516, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.387, val_accuracy=0.914, val_f1_score=0.914]
Validating:  14%|█▍        | 4/29 [00:06<00:30,  1.23s/it][A
Epoch 95:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.129, v_num=1, train_loss=0.0516, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.387, val_accuracy=0.914, val_f1_score=0.914]
Validating:  21%|██        | 6/29 [00:07<00:14,  

Epoch 95, global step 21695: val_loss was not in top 2


Epoch 96:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.0492, v_num=1, train_loss=0.00757, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.368, val_accuracy=0.881, val_f1_score=0.881]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 96:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0492, v_num=1, train_loss=0.00757, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.368, val_accuracy=0.881, val_f1_score=0.881]
Validating:   7%|▋         | 2/29 [00:06<01:12,  2.67s/it][A
Epoch 96:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0492, v_num=1, train_loss=0.00757, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.368, val_accuracy=0.881, val_f1_score=0.881]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.02s/it][A
Epoch 96:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0492, v_num=1, train_loss=0.00757, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.368, val_accuracy=0.881, 

Epoch 96, global step 21921: val_loss was not in top 2


Epoch 97:  89%|████████▊ | 226/255 [02:29<00:19,  1.51it/s, loss=0.0336, v_num=1, train_loss=0.00109, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.336, val_accuracy=0.917, val_f1_score=0.917]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 97:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0336, v_num=1, train_loss=0.00109, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.336, val_accuracy=0.917, val_f1_score=0.917]
Validating:   7%|▋         | 2/29 [00:06<01:12,  2.70s/it][A
Epoch 97:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0336, v_num=1, train_loss=0.00109, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.336, val_accuracy=0.917, val_f1_score=0.917]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.01it/s][A
Epoch 97:  91%|█████████ | 232/255 [02:36<00:15,  1.48it/s, loss=0.0336, v_num=1, train_loss=0.00109, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.336, val_accuracy=0.917, 

Epoch 97, global step 22147: val_loss was not in top 2


Epoch 98:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.0482, v_num=1, train_loss=0.152, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.350, val_accuracy=0.918, val_f1_score=0.918]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 98:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0482, v_num=1, train_loss=0.152, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.350, val_accuracy=0.918, val_f1_score=0.918]
Validating:   7%|▋         | 2/29 [00:06<01:12,  2.67s/it][A
Epoch 98:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0482, v_num=1, train_loss=0.152, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.350, val_accuracy=0.918, val_f1_score=0.918]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.02it/s][A
Epoch 98:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0482, v_num=1, train_loss=0.152, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.350, val_accuracy=0.918, val_f1

Epoch 98, global step 22373: val_loss was not in top 2


Epoch 99:  89%|████████▊ | 226/255 [02:30<00:19,  1.51it/s, loss=0.0763, v_num=1, train_loss=0.0047, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.398, val_accuracy=0.907, val_f1_score=0.907] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 99:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0763, v_num=1, train_loss=0.0047, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.398, val_accuracy=0.907, val_f1_score=0.907]
Validating:   7%|▋         | 2/29 [00:06<01:12,  2.68s/it][A
Epoch 99:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0763, v_num=1, train_loss=0.0047, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.398, val_accuracy=0.907, val_f1_score=0.907]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.01it/s][A
Epoch 99:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0763, v_num=1, train_loss=0.0047, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.398, val_accuracy=0.907, val

Epoch 99, global step 22599: val_loss was not in top 2


Epoch 100:  89%|████████▊ | 226/255 [02:32<00:19,  1.48it/s, loss=0.0573, v_num=1, train_loss=0.0596, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.382, val_accuracy=0.906, val_f1_score=0.906] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 100:  89%|████████▉ | 228/255 [02:38<00:18,  1.44it/s, loss=0.0573, v_num=1, train_loss=0.0596, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.382, val_accuracy=0.906, val_f1_score=0.906]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.64s/it][A
Epoch 100:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.0573, v_num=1, train_loss=0.0596, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.382, val_accuracy=0.906, val_f1_score=0.906]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.02it/s][A
Epoch 100:  91%|█████████ | 232/255 [02:39<00:15,  1.46it/s, loss=0.0573, v_num=1, train_loss=0.0596, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.382, val_accuracy=0.906,

Epoch 100, global step 22825: val_loss was not in top 2


Epoch 101:  89%|████████▊ | 226/255 [02:31<00:19,  1.49it/s, loss=0.0536, v_num=1, train_loss=0.00545, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.385, val_accuracy=0.907, val_f1_score=0.907]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 101:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.0536, v_num=1, train_loss=0.00545, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.385, val_accuracy=0.907, val_f1_score=0.907]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.66s/it][A
Epoch 101:  90%|█████████ | 230/255 [02:38<00:17,  1.46it/s, loss=0.0536, v_num=1, train_loss=0.00545, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.385, val_accuracy=0.907, val_f1_score=0.907]
Epoch 101:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.0536, v_num=1, train_loss=0.00545, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.385, val_accuracy=0.907, val_f1_score=0.907]
Validating:  21%|██        | 6/29 [00:

Epoch 101, global step 23051: val_loss was not in top 2


Epoch 102:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.063, v_num=1, train_loss=0.405, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.457, val_accuracy=0.889, val_f1_score=0.889]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 102:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.063, v_num=1, train_loss=0.405, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.457, val_accuracy=0.889, val_f1_score=0.889]
Validating:   7%|▋         | 2/29 [00:06<01:13,  2.71s/it][A
Epoch 102:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.063, v_num=1, train_loss=0.405, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.457, val_accuracy=0.889, val_f1_score=0.889]
Validating:  14%|█▍        | 4/29 [00:06<00:26,  1.04s/it][A
Epoch 102:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.063, v_num=1, train_loss=0.405, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.457, val_accuracy=0.889, val_f

Epoch 102, global step 23277: val_loss was not in top 2


Epoch 103:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.0502, v_num=1, train_loss=0.00758, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.583, val_accuracy=0.883, val_f1_score=0.883]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 103:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0502, v_num=1, train_loss=0.00758, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.583, val_accuracy=0.883, val_f1_score=0.883]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.63s/it][A
Epoch 103:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0502, v_num=1, train_loss=0.00758, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.583, val_accuracy=0.883, val_f1_score=0.883]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.00s/it][A
Epoch 103:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0502, v_num=1, train_loss=0.00758, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.583, val_accuracy=0.8

Epoch 103, global step 23503: val_loss was not in top 2


Epoch 104:  89%|████████▊ | 226/255 [02:29<00:19,  1.51it/s, loss=0.0388, v_num=1, train_loss=0.0246, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.377, val_accuracy=0.913, val_f1_score=0.913] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 104:  89%|████████▉ | 228/255 [02:35<00:18,  1.46it/s, loss=0.0388, v_num=1, train_loss=0.0246, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.377, val_accuracy=0.913, val_f1_score=0.913]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.67s/it][A
Epoch 104:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0388, v_num=1, train_loss=0.0246, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.377, val_accuracy=0.913, val_f1_score=0.913]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.02s/it][A
Epoch 104:  91%|█████████ | 232/255 [02:36<00:15,  1.48it/s, loss=0.0388, v_num=1, train_loss=0.0246, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.377, val_accuracy=0.913,

Epoch 104, global step 23729: val_loss reached 0.30696 (best 0.30696), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v3.ckpt" as top 2


Epoch 105:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.0799, v_num=1, train_loss=0.0944, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.307, val_accuracy=0.923, val_f1_score=0.923] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 105:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0799, v_num=1, train_loss=0.0944, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.307, val_accuracy=0.923, val_f1_score=0.923]
Validating:   7%|▋         | 2/29 [00:06<01:13,  2.71s/it][A
Epoch 105:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0799, v_num=1, train_loss=0.0944, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.307, val_accuracy=0.923, val_f1_score=0.923]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.01it/s][A
Epoch 105:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0799, v_num=1, train_loss=0.0944, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.307, val_accuracy=0.923,

Epoch 105, global step 23955: val_loss reached 0.31037 (best 0.30696), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v2.ckpt" as top 2


Epoch 106:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.0457, v_num=1, train_loss=0.0101, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.310, val_accuracy=0.916, val_f1_score=0.916] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 106:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0457, v_num=1, train_loss=0.0101, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.310, val_accuracy=0.916, val_f1_score=0.916]
Validating:   7%|▋         | 2/29 [00:06<01:12,  2.68s/it][A
Epoch 106:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0457, v_num=1, train_loss=0.0101, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.310, val_accuracy=0.916, val_f1_score=0.916]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.00it/s][A
Epoch 106:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0457, v_num=1, train_loss=0.0101, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.310, val_accuracy=0.916,

Epoch 106, global step 24181: val_loss was not in top 2


Epoch 107:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.297, v_num=1, train_loss=0.190, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.323, val_accuracy=0.920, val_f1_score=0.920]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 107:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.297, v_num=1, train_loss=0.190, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.323, val_accuracy=0.920, val_f1_score=0.920]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.65s/it][A
Epoch 107:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.297, v_num=1, train_loss=0.190, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.323, val_accuracy=0.920, val_f1_score=0.920]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.01s/it][A
Epoch 107:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.297, v_num=1, train_loss=0.190, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.323, val_accuracy=0.920, val_f

Epoch 107, global step 24407: val_loss was not in top 2


Epoch 108:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.037, v_num=1, train_loss=0.00518, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.542, val_accuracy=0.858, val_f1_score=0.858] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 108:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.037, v_num=1, train_loss=0.00518, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.542, val_accuracy=0.858, val_f1_score=0.858]
Epoch 108:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.037, v_num=1, train_loss=0.00518, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.542, val_accuracy=0.858, val_f1_score=0.858]
Epoch 108:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.037, v_num=1, train_loss=0.00518, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.542, val_accuracy=0.858, val_f1_score=0.858]
Epoch 108:  92%|█████████▏| 234/255 [02:37<00:14,  1.49it/s, loss=0.037, v_num=1, train_loss=0.00518, t

Epoch 108, global step 24633: val_loss was not in top 2


Epoch 109:  89%|████████▊ | 226/255 [02:33<00:19,  1.47it/s, loss=0.141, v_num=1, train_loss=0.0288, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.346, val_accuracy=0.921, val_f1_score=0.921]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 109:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.141, v_num=1, train_loss=0.0288, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.346, val_accuracy=0.921, val_f1_score=0.921]
Validating:   7%|▋         | 2/29 [00:06<01:13,  2.72s/it][A
Epoch 109:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.141, v_num=1, train_loss=0.0288, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.346, val_accuracy=0.921, val_f1_score=0.921]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.04s/it][A
Epoch 109:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.141, v_num=1, train_loss=0.0288, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.346, val_accuracy=0.921, va

Epoch 109, global step 24859: val_loss was not in top 2


Epoch 110:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.0599, v_num=1, train_loss=0.0209, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.364, val_accuracy=0.914, val_f1_score=0.914] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 110:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0599, v_num=1, train_loss=0.0209, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.364, val_accuracy=0.914, val_f1_score=0.914]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.65s/it][A
Epoch 110:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0599, v_num=1, train_loss=0.0209, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.364, val_accuracy=0.914, val_f1_score=0.914]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.01s/it][A
Epoch 110:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0599, v_num=1, train_loss=0.0209, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.364, val_accuracy=0.914,

Epoch 110, global step 25085: val_loss was not in top 2


Epoch 111:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.0951, v_num=1, train_loss=0.266, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.322, val_accuracy=0.920, val_f1_score=0.920]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 111:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0951, v_num=1, train_loss=0.266, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.322, val_accuracy=0.920, val_f1_score=0.920]
Validating:   7%|▋         | 2/29 [00:06<01:12,  2.68s/it][A
Epoch 111:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0951, v_num=1, train_loss=0.266, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.322, val_accuracy=0.920, val_f1_score=0.920]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.00it/s][A
Epoch 111:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0951, v_num=1, train_loss=0.266, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.322, val_accuracy=0.920, va

Epoch 111, global step 25311: val_loss was not in top 2


Epoch 112:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.112, v_num=1, train_loss=0.0274, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.410, val_accuracy=0.904, val_f1_score=0.904] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 112:  89%|████████▉ | 228/255 [02:37<00:18,  1.45it/s, loss=0.112, v_num=1, train_loss=0.0274, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.410, val_accuracy=0.904, val_f1_score=0.904]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.66s/it][A
Epoch 112:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.112, v_num=1, train_loss=0.0274, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.410, val_accuracy=0.904, val_f1_score=0.904]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.01s/it][A
Epoch 112:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.112, v_num=1, train_loss=0.0274, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.410, val_accuracy=0.904, val

Epoch 112, global step 25537: val_loss reached 0.30757 (best 0.30696), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v2.ckpt" as top 2


Epoch 113:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.073, v_num=1, train_loss=0.171, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.308, val_accuracy=0.897, val_f1_score=0.897]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 113:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.073, v_num=1, train_loss=0.171, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.308, val_accuracy=0.897, val_f1_score=0.897]
Validating:   7%|▋         | 2/29 [00:06<01:10,  2.61s/it][A
Epoch 113:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.073, v_num=1, train_loss=0.171, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.308, val_accuracy=0.897, val_f1_score=0.897]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.00it/s][A
Epoch 113:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.073, v_num=1, train_loss=0.171, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.308, val_accuracy=0.897, val_f1

Epoch 113, global step 25763: val_loss was not in top 2


Epoch 114:  89%|████████▊ | 226/255 [02:30<00:19,  1.51it/s, loss=0.0684, v_num=1, train_loss=0.071, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.312, val_accuracy=0.911, val_f1_score=0.911] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 114:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0684, v_num=1, train_loss=0.071, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.312, val_accuracy=0.911, val_f1_score=0.911]
Validating:   7%|▋         | 2/29 [00:06<01:12,  2.70s/it][A
Epoch 114:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0684, v_num=1, train_loss=0.071, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.312, val_accuracy=0.911, val_f1_score=0.911]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.00it/s][A
Epoch 114:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0684, v_num=1, train_loss=0.071, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.312, val_accuracy=0.911, val

Epoch 114, global step 25989: val_loss reached 0.27465 (best 0.27465), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v2.ckpt" as top 2


Epoch 115:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.0634, v_num=1, train_loss=0.0416, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.275, val_accuracy=0.921, val_f1_score=0.921] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 115:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.0634, v_num=1, train_loss=0.0416, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.275, val_accuracy=0.921, val_f1_score=0.921]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.66s/it][A
Epoch 115:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0634, v_num=1, train_loss=0.0416, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.275, val_accuracy=0.921, val_f1_score=0.921]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.02s/it][A
Epoch 115:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0634, v_num=1, train_loss=0.0416, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.275, val_accuracy=0.921,

Epoch 115, global step 26215: val_loss was not in top 2


Epoch 116:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.0548, v_num=1, train_loss=0.163, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.311, val_accuracy=0.911, val_f1_score=0.911]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 116:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0548, v_num=1, train_loss=0.163, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.311, val_accuracy=0.911, val_f1_score=0.911]
Validating:   7%|▋         | 2/29 [00:06<01:09,  2.58s/it][A
Epoch 116:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0548, v_num=1, train_loss=0.163, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.311, val_accuracy=0.911, val_f1_score=0.911]
Epoch 116:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0548, v_num=1, train_loss=0.163, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.311, val_accuracy=0.911, val_f1_score=0.911]
Validating:  21%|██        | 6/29 [00:06<00:

Epoch 116, global step 26441: val_loss was not in top 2


Epoch 117:  89%|████████▊ | 226/255 [02:32<00:19,  1.48it/s, loss=0.0453, v_num=1, train_loss=0.0383, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.919, val_f1_score=0.919] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 117:  89%|████████▉ | 228/255 [02:38<00:18,  1.44it/s, loss=0.0453, v_num=1, train_loss=0.0383, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.919, val_f1_score=0.919]
Validating:   7%|▋         | 2/29 [00:06<01:12,  2.68s/it][A
Epoch 117:  90%|█████████ | 230/255 [02:39<00:17,  1.45it/s, loss=0.0453, v_num=1, train_loss=0.0383, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.919, val_f1_score=0.919]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.00it/s][A
Epoch 117:  91%|█████████ | 232/255 [02:39<00:15,  1.45it/s, loss=0.0453, v_num=1, train_loss=0.0383, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.919,

Epoch 117, global step 26667: val_loss reached 0.28477 (best 0.27465), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v3.ckpt" as top 2


Epoch 118:  89%|████████▊ | 226/255 [02:30<00:19,  1.51it/s, loss=0.0982, v_num=1, train_loss=0.291, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.285, val_accuracy=0.922, val_f1_score=0.922]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 118:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0982, v_num=1, train_loss=0.291, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.285, val_accuracy=0.922, val_f1_score=0.922]
Validating:   7%|▋         | 2/29 [00:06<01:12,  2.68s/it][A
Epoch 118:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0982, v_num=1, train_loss=0.291, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.285, val_accuracy=0.922, val_f1_score=0.922]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.02s/it][A
Epoch 118:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0982, v_num=1, train_loss=0.291, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.285, val_accuracy=0.922, va

Epoch 118, global step 26893: val_loss was not in top 2


Epoch 119:  89%|████████▊ | 226/255 [02:29<00:19,  1.51it/s, loss=0.0342, v_num=1, train_loss=0.0233, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.296, val_accuracy=0.908, val_f1_score=0.908] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 119:  89%|████████▉ | 228/255 [02:35<00:18,  1.47it/s, loss=0.0342, v_num=1, train_loss=0.0233, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.296, val_accuracy=0.908, val_f1_score=0.908]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.67s/it][A
Epoch 119:  90%|█████████ | 230/255 [02:35<00:16,  1.48it/s, loss=0.0342, v_num=1, train_loss=0.0233, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.296, val_accuracy=0.908, val_f1_score=0.908]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.02it/s][A
Epoch 119:  91%|█████████ | 232/255 [02:36<00:15,  1.48it/s, loss=0.0342, v_num=1, train_loss=0.0233, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.296, val_accuracy=0.908,

Epoch 119, global step 27119: val_loss reached 0.28462 (best 0.27465), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v3.ckpt" as top 2


Epoch 120:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.0316, v_num=1, train_loss=0.0548, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.285, val_accuracy=0.922, val_f1_score=0.922] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 120:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0316, v_num=1, train_loss=0.0548, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.285, val_accuracy=0.922, val_f1_score=0.922]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.65s/it][A
Epoch 120:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0316, v_num=1, train_loss=0.0548, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.285, val_accuracy=0.922, val_f1_score=0.922]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.03it/s][A
Epoch 120:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0316, v_num=1, train_loss=0.0548, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.285, val_accuracy=0.922,

Epoch 120, global step 27345: val_loss reached 0.28318 (best 0.27465), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v3.ckpt" as top 2


Epoch 121:  89%|████████▊ | 226/255 [02:29<00:19,  1.51it/s, loss=0.0459, v_num=1, train_loss=0.016, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.283, val_accuracy=0.926, val_f1_score=0.926]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 121:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0459, v_num=1, train_loss=0.016, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.283, val_accuracy=0.926, val_f1_score=0.926]
Validating:   7%|▋         | 2/29 [00:06<01:12,  2.69s/it][A
Epoch 121:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0459, v_num=1, train_loss=0.016, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.283, val_accuracy=0.926, val_f1_score=0.926]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.02s/it][A
Epoch 121:  91%|█████████ | 232/255 [02:36<00:15,  1.48it/s, loss=0.0459, v_num=1, train_loss=0.016, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.283, val_accuracy=0.926, va

Epoch 121, global step 27571: val_loss was not in top 2


Epoch 122:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.0504, v_num=1, train_loss=0.170, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.315, val_accuracy=0.925, val_f1_score=0.925]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 122:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0504, v_num=1, train_loss=0.170, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.315, val_accuracy=0.925, val_f1_score=0.925]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.65s/it][A
Epoch 122:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0504, v_num=1, train_loss=0.170, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.315, val_accuracy=0.925, val_f1_score=0.925]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.01s/it][A
Epoch 122:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0504, v_num=1, train_loss=0.170, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.315, val_accuracy=0.925, va

Epoch 122, global step 27797: val_loss was not in top 2


Epoch 123:  89%|████████▊ | 226/255 [02:30<00:19,  1.51it/s, loss=0.0276, v_num=1, train_loss=0.00241, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.301, val_accuracy=0.928, val_f1_score=0.928]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 123:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0276, v_num=1, train_loss=0.00241, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.301, val_accuracy=0.928, val_f1_score=0.928]
Validating:   7%|▋         | 2/29 [00:06<01:12,  2.68s/it][A
Epoch 123:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0276, v_num=1, train_loss=0.00241, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.301, val_accuracy=0.928, val_f1_score=0.928]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.02it/s][A
Epoch 123:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0276, v_num=1, train_loss=0.00241, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.301, val_accuracy=0

Epoch 123, global step 28023: val_loss was not in top 2


Epoch 124:  89%|████████▊ | 226/255 [02:30<00:19,  1.51it/s, loss=0.0237, v_num=1, train_loss=0.0116, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.340, val_accuracy=0.921, val_f1_score=0.921]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 124:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0237, v_num=1, train_loss=0.0116, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.340, val_accuracy=0.921, val_f1_score=0.921]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.64s/it][A
Epoch 124:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0237, v_num=1, train_loss=0.0116, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.340, val_accuracy=0.921, val_f1_score=0.921]
Epoch 124:  91%|█████████ | 232/255 [02:36<00:15,  1.48it/s, loss=0.0237, v_num=1, train_loss=0.0116, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.340, val_accuracy=0.921, val_f1_score=0.921]
Validating:  21%|██        | 6/29 [00:07

Epoch 124, global step 28249: val_loss was not in top 2


Epoch 125:  89%|████████▊ | 226/255 [02:34<00:19,  1.46it/s, loss=0.0279, v_num=1, train_loss=0.0138, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.313, val_accuracy=0.931, val_f1_score=0.931] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 125:  89%|████████▉ | 228/255 [02:41<00:19,  1.42it/s, loss=0.0279, v_num=1, train_loss=0.0138, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.313, val_accuracy=0.931, val_f1_score=0.931]
Validating:   7%|▋         | 2/29 [00:06<01:13,  2.73s/it][A
Epoch 125:  90%|█████████ | 230/255 [02:41<00:17,  1.43it/s, loss=0.0279, v_num=1, train_loss=0.0138, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.313, val_accuracy=0.931, val_f1_score=0.931]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.02s/it][A
Epoch 125:  91%|█████████ | 232/255 [02:41<00:16,  1.43it/s, loss=0.0279, v_num=1, train_loss=0.0138, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.313, val_accuracy=0.931,

Epoch 125, global step 28475: val_loss was not in top 2


Epoch 126:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.0214, v_num=1, train_loss=0.0123, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.381, val_accuracy=0.919, val_f1_score=0.919] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 126:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0214, v_num=1, train_loss=0.0123, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.381, val_accuracy=0.919, val_f1_score=0.919]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.65s/it][A
Epoch 126:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0214, v_num=1, train_loss=0.0123, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.381, val_accuracy=0.919, val_f1_score=0.919]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.02s/it][A
Epoch 126:  91%|█████████ | 232/255 [02:37<00:15,  1.48it/s, loss=0.0214, v_num=1, train_loss=0.0123, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.381, val_accuracy=0.919,

Epoch 126, global step 28701: val_loss was not in top 2


Epoch 127:  89%|████████▊ | 226/255 [02:30<00:19,  1.51it/s, loss=0.0739, v_num=1, train_loss=0.0789, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.304, val_accuracy=0.928, val_f1_score=0.928] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 127:  89%|████████▉ | 228/255 [02:36<00:18,  1.46it/s, loss=0.0739, v_num=1, train_loss=0.0789, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.304, val_accuracy=0.928, val_f1_score=0.928]
Validating:   7%|▋         | 2/29 [00:06<01:11,  2.66s/it][A
Epoch 127:  90%|█████████ | 230/255 [02:36<00:17,  1.47it/s, loss=0.0739, v_num=1, train_loss=0.0789, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.304, val_accuracy=0.928, val_f1_score=0.928]
Epoch 127:  91%|█████████ | 232/255 [02:36<00:15,  1.48it/s, loss=0.0739, v_num=1, train_loss=0.0789, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.304, val_accuracy=0.928, val_f1_score=0.928]
Validating:  21%|██        | 6/29 [00:07<

Epoch 127, global step 28927: val_loss was not in top 2


Epoch 128:  89%|████████▊ | 226/255 [02:30<00:19,  1.50it/s, loss=0.0484, v_num=1, train_loss=0.0212, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.303, val_accuracy=0.920, val_f1_score=0.920] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 128:  89%|████████▉ | 228/255 [02:36<00:18,  1.45it/s, loss=0.0484, v_num=1, train_loss=0.0212, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.303, val_accuracy=0.920, val_f1_score=0.920]
Validating:   7%|▋         | 2/29 [00:06<01:12,  2.68s/it][A
Epoch 128:  90%|█████████ | 230/255 [02:37<00:17,  1.46it/s, loss=0.0484, v_num=1, train_loss=0.0212, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.303, val_accuracy=0.920, val_f1_score=0.920]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.02it/s][A
Epoch 128:  91%|█████████ | 232/255 [02:37<00:15,  1.47it/s, loss=0.0484, v_num=1, train_loss=0.0212, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.303, val_accuracy=0.920,

Epoch 128, global step 29153: val_loss was not in top 2


Epoch 129:  89%|████████▊ | 226/255 [01:58<00:15,  1.90it/s, loss=0.0317, v_num=1, train_loss=0.0012, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.294, val_accuracy=0.924, val_f1_score=0.924] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 129:  89%|████████▉ | 228/255 [02:04<00:14,  1.83it/s, loss=0.0317, v_num=1, train_loss=0.0012, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.294, val_accuracy=0.924, val_f1_score=0.924]
Epoch 129:  90%|█████████ | 230/255 [02:04<00:13,  1.84it/s, loss=0.0317, v_num=1, train_loss=0.0012, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.294, val_accuracy=0.924, val_f1_score=0.924]
Epoch 129:  91%|█████████ | 232/255 [02:05<00:12,  1.86it/s, loss=0.0317, v_num=1, train_loss=0.0012, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.294, val_accuracy=0.924, val_f1_score=0.924]
Epoch 129:  92%|█████████▏| 234/255 [02:05<00:11,  1.87it/s, loss=0.0317, v_num=1, train_loss=0.0012, t

Epoch 129, global step 29379: val_loss was not in top 2


Epoch 130:  89%|████████▊ | 226/255 [01:21<00:10,  2.78it/s, loss=0.0388, v_num=1, train_loss=0.0325, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.346, val_accuracy=0.919, val_f1_score=0.919] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 130:  89%|████████▉ | 228/255 [01:27<00:10,  2.62it/s, loss=0.0388, v_num=1, train_loss=0.0325, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.346, val_accuracy=0.919, val_f1_score=0.919]
Epoch 130:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.0388, v_num=1, train_loss=0.0325, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.346, val_accuracy=0.919, val_f1_score=0.919]
Epoch 130:  91%|█████████ | 232/255 [01:27<00:08,  2.65it/s, loss=0.0388, v_num=1, train_loss=0.0325, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.346, val_accuracy=0.919, val_f1_score=0.919]
Epoch 130:  92%|█████████▏| 234/255 [01:27<00:07,  2.67it/s, loss=0.0388, v_num=1, train_loss=0.0325, t

Epoch 130, global step 29605: val_loss was not in top 2


Epoch 131:  89%|████████▊ | 226/255 [01:20<00:10,  2.80it/s, loss=0.0235, v_num=1, train_loss=0.0341, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.377, val_accuracy=0.912, val_f1_score=0.912] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 131:  89%|████████▉ | 228/255 [01:26<00:10,  2.64it/s, loss=0.0235, v_num=1, train_loss=0.0341, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.377, val_accuracy=0.912, val_f1_score=0.912]
Epoch 131:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.0235, v_num=1, train_loss=0.0341, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.377, val_accuracy=0.912, val_f1_score=0.912]
Epoch 131:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.0235, v_num=1, train_loss=0.0341, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.377, val_accuracy=0.912, val_f1_score=0.912]
Epoch 131:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.0235, v_num=1, train_loss=0.0341, t

Epoch 131, global step 29831: val_loss was not in top 2


Epoch 132:  89%|████████▊ | 226/255 [01:20<00:10,  2.80it/s, loss=0.0415, v_num=1, train_loss=0.0293, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.396, val_accuracy=0.919, val_f1_score=0.919]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 132:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.0415, v_num=1, train_loss=0.0293, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.396, val_accuracy=0.919, val_f1_score=0.919]
Epoch 132:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0415, v_num=1, train_loss=0.0293, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.396, val_accuracy=0.919, val_f1_score=0.919]
Epoch 132:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.0415, v_num=1, train_loss=0.0293, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.396, val_accuracy=0.919, val_f1_score=0.919]
Epoch 132:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.0415, v_num=1, train_loss=0.0293, 

Epoch 132, global step 30057: val_loss was not in top 2


Epoch 133:  89%|████████▊ | 226/255 [01:20<00:10,  2.80it/s, loss=0.0423, v_num=1, train_loss=0.0134, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.349, val_accuracy=0.927, val_f1_score=0.927]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 133:  89%|████████▉ | 228/255 [01:26<00:10,  2.64it/s, loss=0.0423, v_num=1, train_loss=0.0134, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.349, val_accuracy=0.927, val_f1_score=0.927]
Epoch 133:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.0423, v_num=1, train_loss=0.0134, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.349, val_accuracy=0.927, val_f1_score=0.927]
Epoch 133:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.0423, v_num=1, train_loss=0.0134, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.349, val_accuracy=0.927, val_f1_score=0.927]
Epoch 133:  92%|█████████▏| 234/255 [01:26<00:07,  2.69it/s, loss=0.0423, v_num=1, train_loss=0.0134, 

Epoch 133, global step 30283: val_loss was not in top 2


Epoch 134:  89%|████████▊ | 226/255 [01:22<00:10,  2.75it/s, loss=0.0209, v_num=1, train_loss=0.0251, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.365, val_accuracy=0.923, val_f1_score=0.923]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 134:  89%|████████▉ | 228/255 [01:27<00:10,  2.60it/s, loss=0.0209, v_num=1, train_loss=0.0251, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.365, val_accuracy=0.923, val_f1_score=0.923]
Epoch 134:  90%|█████████ | 230/255 [01:27<00:09,  2.62it/s, loss=0.0209, v_num=1, train_loss=0.0251, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.365, val_accuracy=0.923, val_f1_score=0.923]
Epoch 134:  91%|█████████ | 232/255 [01:28<00:08,  2.63it/s, loss=0.0209, v_num=1, train_loss=0.0251, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.365, val_accuracy=0.923, val_f1_score=0.923]
Epoch 134:  92%|█████████▏| 234/255 [01:28<00:07,  2.65it/s, loss=0.0209, v_num=1, train_loss=0.0251, 

Epoch 134, global step 30509: val_loss was not in top 2


Epoch 135:  89%|████████▊ | 226/255 [01:24<00:10,  2.67it/s, loss=0.0321, v_num=1, train_loss=0.00252, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.367, val_accuracy=0.929, val_f1_score=0.929]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 135:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.0321, v_num=1, train_loss=0.00252, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.367, val_accuracy=0.929, val_f1_score=0.929]
Epoch 135:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.0321, v_num=1, train_loss=0.00252, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.367, val_accuracy=0.929, val_f1_score=0.929]
Epoch 135:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.0321, v_num=1, train_loss=0.00252, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.367, val_accuracy=0.929, val_f1_score=0.929]
Epoch 135:  92%|█████████▏| 234/255 [01:30<00:08,  2.57it/s, loss=0.0321, v_num=1, train_loss=0.00

Epoch 135, global step 30735: val_loss was not in top 2


Epoch 136:  89%|████████▊ | 226/255 [01:24<00:10,  2.67it/s, loss=0.0205, v_num=1, train_loss=0.00463, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.367, val_accuracy=0.924, val_f1_score=0.924] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 136:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.0205, v_num=1, train_loss=0.00463, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.367, val_accuracy=0.924, val_f1_score=0.924]
Epoch 136:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.0205, v_num=1, train_loss=0.00463, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.367, val_accuracy=0.924, val_f1_score=0.924]
Epoch 136:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.0205, v_num=1, train_loss=0.00463, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.367, val_accuracy=0.924, val_f1_score=0.924]
Epoch 136:  92%|█████████▏| 234/255 [01:30<00:08,  2.57it/s, loss=0.0205, v_num=1, train_loss=0.004

Epoch 136, global step 30961: val_loss was not in top 2


Epoch 137:  89%|████████▊ | 226/255 [01:24<00:10,  2.66it/s, loss=0.0192, v_num=1, train_loss=0.000355, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.340, val_accuracy=0.923, val_f1_score=0.923] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 137:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.0192, v_num=1, train_loss=0.000355, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.340, val_accuracy=0.923, val_f1_score=0.923]
Epoch 137:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.0192, v_num=1, train_loss=0.000355, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.340, val_accuracy=0.923, val_f1_score=0.923]
Epoch 137:  91%|█████████ | 232/255 [01:30<00:09,  2.55it/s, loss=0.0192, v_num=1, train_loss=0.000355, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.340, val_accuracy=0.923, val_f1_score=0.923]
Epoch 137:  92%|█████████▏| 234/255 [01:31<00:08,  2.57it/s, loss=0.0192, v_num=1, train_loss=0

Epoch 137, global step 31187: val_loss was not in top 2


Epoch 138:  89%|████████▊ | 226/255 [01:25<00:10,  2.66it/s, loss=0.0195, v_num=1, train_loss=0.000996, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.347, val_accuracy=0.930, val_f1_score=0.930]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 138:  89%|████████▉ | 228/255 [01:30<00:10,  2.51it/s, loss=0.0195, v_num=1, train_loss=0.000996, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.347, val_accuracy=0.930, val_f1_score=0.930]
Epoch 138:  90%|█████████ | 230/255 [01:30<00:09,  2.53it/s, loss=0.0195, v_num=1, train_loss=0.000996, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.347, val_accuracy=0.930, val_f1_score=0.930]
Epoch 138:  91%|█████████ | 232/255 [01:31<00:09,  2.55it/s, loss=0.0195, v_num=1, train_loss=0.000996, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.347, val_accuracy=0.930, val_f1_score=0.930]
Epoch 138:  92%|█████████▏| 234/255 [01:31<00:08,  2.57it/s, loss=0.0195, v_num=1, train_loss=0.

Epoch 138, global step 31413: val_loss was not in top 2


Epoch 139:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.0263, v_num=1, train_loss=0.013, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.345, val_accuracy=0.929, val_f1_score=0.929]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 139:  89%|████████▉ | 228/255 [01:30<00:10,  2.51it/s, loss=0.0263, v_num=1, train_loss=0.013, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.345, val_accuracy=0.929, val_f1_score=0.929]
Epoch 139:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.0263, v_num=1, train_loss=0.013, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.345, val_accuracy=0.929, val_f1_score=0.929]
Epoch 139:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.0263, v_num=1, train_loss=0.013, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.345, val_accuracy=0.929, val_f1_score=0.929]
Epoch 139:  92%|█████████▏| 234/255 [01:31<00:08,  2.56it/s, loss=0.0263, v_num=1, train_loss=0.013, trai

Epoch 139, global step 31639: val_loss was not in top 2


Epoch 140:  89%|████████▊ | 226/255 [01:25<00:10,  2.66it/s, loss=0.0197, v_num=1, train_loss=0.103, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.340, val_accuracy=0.927, val_f1_score=0.927]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 140:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.0197, v_num=1, train_loss=0.103, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.340, val_accuracy=0.927, val_f1_score=0.927]
Epoch 140:  90%|█████████ | 230/255 [01:30<00:09,  2.53it/s, loss=0.0197, v_num=1, train_loss=0.103, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.340, val_accuracy=0.927, val_f1_score=0.927]
Epoch 140:  91%|█████████ | 232/255 [01:31<00:09,  2.55it/s, loss=0.0197, v_num=1, train_loss=0.103, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.340, val_accuracy=0.927, val_f1_score=0.927]
Epoch 140:  92%|█████████▏| 234/255 [01:31<00:08,  2.57it/s, loss=0.0197, v_num=1, train_loss=0.103, trai

Epoch 140, global step 31865: val_loss was not in top 2


Epoch 141:  89%|████████▊ | 226/255 [01:25<00:10,  2.66it/s, loss=0.0188, v_num=1, train_loss=0.000166, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.406, val_accuracy=0.923, val_f1_score=0.923] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 141:  89%|████████▉ | 228/255 [01:30<00:10,  2.51it/s, loss=0.0188, v_num=1, train_loss=0.000166, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.406, val_accuracy=0.923, val_f1_score=0.923]
Epoch 141:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.0188, v_num=1, train_loss=0.000166, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.406, val_accuracy=0.923, val_f1_score=0.923]
Epoch 141:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.0188, v_num=1, train_loss=0.000166, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.406, val_accuracy=0.923, val_f1_score=0.923]
Epoch 141:  92%|█████████▏| 234/255 [01:31<00:08,  2.56it/s, loss=0.0188, v_num=1, train_loss=0

Epoch 141, global step 32091: val_loss was not in top 2


Epoch 142:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.0105, v_num=1, train_loss=0.000688, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.393, val_accuracy=0.927, val_f1_score=0.927]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 142:  89%|████████▉ | 228/255 [01:30<00:10,  2.51it/s, loss=0.0105, v_num=1, train_loss=0.000688, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.393, val_accuracy=0.927, val_f1_score=0.927]
Epoch 142:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.0105, v_num=1, train_loss=0.000688, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.393, val_accuracy=0.927, val_f1_score=0.927]
Epoch 142:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.0105, v_num=1, train_loss=0.000688, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.393, val_accuracy=0.927, val_f1_score=0.927]
Epoch 142:  92%|█████████▏| 234/255 [01:31<00:08,  2.56it/s, loss=0.0105, v_num=1, train_loss=0.

Epoch 142, global step 32317: val_loss was not in top 2


Epoch 143:  89%|████████▊ | 226/255 [01:24<00:10,  2.66it/s, loss=0.0522, v_num=1, train_loss=0.0343, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.330, val_accuracy=0.933, val_f1_score=0.933]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 143:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.0522, v_num=1, train_loss=0.0343, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.330, val_accuracy=0.933, val_f1_score=0.933]
Epoch 143:  90%|█████████ | 230/255 [01:30<00:09,  2.53it/s, loss=0.0522, v_num=1, train_loss=0.0343, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.330, val_accuracy=0.933, val_f1_score=0.933]
Epoch 143:  91%|█████████ | 232/255 [01:30<00:09,  2.55it/s, loss=0.0522, v_num=1, train_loss=0.0343, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.330, val_accuracy=0.933, val_f1_score=0.933]
Epoch 143:  92%|█████████▏| 234/255 [01:31<00:08,  2.57it/s, loss=0.0522, v_num=1, train_loss=0.0343, 

Epoch 143, global step 32543: val_loss was not in top 2


Epoch 144:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.0153, v_num=1, train_loss=0.00522, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.349, val_accuracy=0.930, val_f1_score=0.930] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 144:  89%|████████▉ | 228/255 [01:31<00:10,  2.50it/s, loss=0.0153, v_num=1, train_loss=0.00522, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.349, val_accuracy=0.930, val_f1_score=0.930]
Epoch 144:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.0153, v_num=1, train_loss=0.00522, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.349, val_accuracy=0.930, val_f1_score=0.930]
Epoch 144:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.0153, v_num=1, train_loss=0.00522, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.349, val_accuracy=0.930, val_f1_score=0.930]
Epoch 144:  92%|█████████▏| 234/255 [01:31<00:08,  2.56it/s, loss=0.0153, v_num=1, train_loss=0.005

Epoch 144, global step 32769: val_loss was not in top 2


Epoch 145:  89%|████████▊ | 226/255 [01:25<00:10,  2.64it/s, loss=0.0289, v_num=1, train_loss=0.0409, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.387, val_accuracy=0.923, val_f1_score=0.923]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 145:  89%|████████▉ | 228/255 [01:31<00:10,  2.49it/s, loss=0.0289, v_num=1, train_loss=0.0409, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.387, val_accuracy=0.923, val_f1_score=0.923]
Epoch 145:  90%|█████████ | 230/255 [01:31<00:09,  2.51it/s, loss=0.0289, v_num=1, train_loss=0.0409, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.387, val_accuracy=0.923, val_f1_score=0.923]
Epoch 145:  91%|█████████ | 232/255 [01:31<00:09,  2.53it/s, loss=0.0289, v_num=1, train_loss=0.0409, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.387, val_accuracy=0.923, val_f1_score=0.923]
Epoch 145:  92%|█████████▏| 234/255 [01:31<00:08,  2.55it/s, loss=0.0289, v_num=1, train_loss=0.0409,

Epoch 145, global step 32995: val_loss was not in top 2


Epoch 146:  89%|████████▊ | 226/255 [01:25<00:10,  2.64it/s, loss=0.0458, v_num=1, train_loss=0.000424, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.397, val_accuracy=0.923, val_f1_score=0.923] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 146:  89%|████████▉ | 228/255 [01:31<00:10,  2.49it/s, loss=0.0458, v_num=1, train_loss=0.000424, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.397, val_accuracy=0.923, val_f1_score=0.923]
Validating:   7%|▋         | 2/29 [00:06<01:07,  2.52s/it][A
Epoch 146:  90%|█████████ | 230/255 [01:31<00:09,  2.51it/s, loss=0.0458, v_num=1, train_loss=0.000424, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.397, val_accuracy=0.923, val_f1_score=0.923]
Epoch 146:  91%|█████████ | 232/255 [01:31<00:09,  2.53it/s, loss=0.0458, v_num=1, train_loss=0.000424, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.397, val_accuracy=0.923, val_f1_score=0.923]
Epoch 146:  92%|█████████▏| 234/2

Epoch 146, global step 33221: val_loss was not in top 2


Epoch 147:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.0216, v_num=1, train_loss=0.0182, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.331, val_accuracy=0.933, val_f1_score=0.933]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 147:  89%|████████▉ | 228/255 [01:31<00:10,  2.50it/s, loss=0.0216, v_num=1, train_loss=0.0182, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.331, val_accuracy=0.933, val_f1_score=0.933]
Epoch 147:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.0216, v_num=1, train_loss=0.0182, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.331, val_accuracy=0.933, val_f1_score=0.933]
Epoch 147:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.0216, v_num=1, train_loss=0.0182, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.331, val_accuracy=0.933, val_f1_score=0.933]
Epoch 147:  92%|█████████▏| 234/255 [01:31<00:08,  2.55it/s, loss=0.0216, v_num=1, train_loss=0.0182,

Epoch 147, global step 33447: val_loss was not in top 2


Epoch 148:  89%|████████▊ | 226/255 [01:24<00:10,  2.66it/s, loss=0.0164, v_num=1, train_loss=0.0167, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.338, val_accuracy=0.929, val_f1_score=0.929]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 148:  89%|████████▉ | 228/255 [01:30<00:10,  2.51it/s, loss=0.0164, v_num=1, train_loss=0.0167, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.338, val_accuracy=0.929, val_f1_score=0.929]
Epoch 148:  90%|█████████ | 230/255 [01:31<00:09,  2.53it/s, loss=0.0164, v_num=1, train_loss=0.0167, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.338, val_accuracy=0.929, val_f1_score=0.929]
Epoch 148:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.0164, v_num=1, train_loss=0.0167, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.338, val_accuracy=0.929, val_f1_score=0.929]
Epoch 148:  92%|█████████▏| 234/255 [01:31<00:08,  2.56it/s, loss=0.0164, v_num=1, train_loss=0.0167,

Epoch 148, global step 33673: val_loss was not in top 2


Epoch 149:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.0303, v_num=1, train_loss=0.0371, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.336, val_accuracy=0.932, val_f1_score=0.932]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 149:  89%|████████▉ | 228/255 [01:30<00:10,  2.51it/s, loss=0.0303, v_num=1, train_loss=0.0371, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.336, val_accuracy=0.932, val_f1_score=0.932]
Epoch 149:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.0303, v_num=1, train_loss=0.0371, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.336, val_accuracy=0.932, val_f1_score=0.932]
Epoch 149:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.0303, v_num=1, train_loss=0.0371, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.336, val_accuracy=0.932, val_f1_score=0.932]
Epoch 149:  92%|█████████▏| 234/255 [01:31<00:08,  2.56it/s, loss=0.0303, v_num=1, train_loss=0.0371, 

Epoch 149, global step 33899: val_loss was not in top 2


Epoch 150:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.0138, v_num=1, train_loss=0.000233, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.345, val_accuracy=0.935, val_f1_score=0.935] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 150:  89%|████████▉ | 228/255 [01:31<00:10,  2.50it/s, loss=0.0138, v_num=1, train_loss=0.000233, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.345, val_accuracy=0.935, val_f1_score=0.935]
Epoch 150:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.0138, v_num=1, train_loss=0.000233, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.345, val_accuracy=0.935, val_f1_score=0.935]
Epoch 150:  91%|█████████ | 232/255 [01:31<00:09,  2.53it/s, loss=0.0138, v_num=1, train_loss=0.000233, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.345, val_accuracy=0.935, val_f1_score=0.935]
Epoch 150:  92%|█████████▏| 234/255 [01:31<00:08,  2.55it/s, loss=0.0138, v_num=1, train_loss=0

Epoch 150, global step 34125: val_loss was not in top 2


Epoch 151:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.0161, v_num=1, train_loss=0.00423, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.362, val_accuracy=0.930, val_f1_score=0.930]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 151:  89%|████████▉ | 228/255 [01:31<00:10,  2.50it/s, loss=0.0161, v_num=1, train_loss=0.00423, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.362, val_accuracy=0.930, val_f1_score=0.930]
Epoch 151:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.0161, v_num=1, train_loss=0.00423, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.362, val_accuracy=0.930, val_f1_score=0.930]
Epoch 151:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.0161, v_num=1, train_loss=0.00423, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.362, val_accuracy=0.930, val_f1_score=0.930]
Epoch 151:  92%|█████████▏| 234/255 [01:31<00:08,  2.55it/s, loss=0.0161, v_num=1, train_loss=0.00

Epoch 151, global step 34351: val_loss was not in top 2


Epoch 152:  89%|████████▊ | 226/255 [01:25<00:10,  2.66it/s, loss=0.0302, v_num=1, train_loss=0.00821, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.386, val_accuracy=0.936, val_f1_score=0.936] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 152:  89%|████████▉ | 228/255 [01:30<00:10,  2.51it/s, loss=0.0302, v_num=1, train_loss=0.00821, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.386, val_accuracy=0.936, val_f1_score=0.936]
Epoch 152:  90%|█████████ | 230/255 [01:30<00:09,  2.53it/s, loss=0.0302, v_num=1, train_loss=0.00821, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.386, val_accuracy=0.936, val_f1_score=0.936]
Epoch 152:  91%|█████████ | 232/255 [01:31<00:09,  2.55it/s, loss=0.0302, v_num=1, train_loss=0.00821, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.386, val_accuracy=0.936, val_f1_score=0.936]
Epoch 152:  92%|█████████▏| 234/255 [01:31<00:08,  2.56it/s, loss=0.0302, v_num=1, train_loss=0.008

Epoch 152, global step 34577: val_loss was not in top 2


Epoch 153:  89%|████████▊ | 226/255 [01:25<00:10,  2.66it/s, loss=0.0141, v_num=1, train_loss=0.0012, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.341, val_accuracy=0.928, val_f1_score=0.928]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 153:  89%|████████▉ | 228/255 [01:30<00:10,  2.51it/s, loss=0.0141, v_num=1, train_loss=0.0012, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.341, val_accuracy=0.928, val_f1_score=0.928]
Epoch 153:  90%|█████████ | 230/255 [01:30<00:09,  2.53it/s, loss=0.0141, v_num=1, train_loss=0.0012, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.341, val_accuracy=0.928, val_f1_score=0.928]
Epoch 153:  91%|█████████ | 232/255 [01:31<00:09,  2.55it/s, loss=0.0141, v_num=1, train_loss=0.0012, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.341, val_accuracy=0.928, val_f1_score=0.928]
Epoch 153:  92%|█████████▏| 234/255 [01:31<00:08,  2.56it/s, loss=0.0141, v_num=1, train_loss=0.0012, 

Epoch 153, global step 34803: val_loss was not in top 2


Epoch 154:  89%|████████▊ | 226/255 [01:25<00:10,  2.66it/s, loss=0.0186, v_num=1, train_loss=0.115, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.352, val_accuracy=0.931, val_f1_score=0.931]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 154:  89%|████████▉ | 228/255 [01:30<00:10,  2.51it/s, loss=0.0186, v_num=1, train_loss=0.115, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.352, val_accuracy=0.931, val_f1_score=0.931]
Epoch 154:  90%|█████████ | 230/255 [01:31<00:09,  2.53it/s, loss=0.0186, v_num=1, train_loss=0.115, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.352, val_accuracy=0.931, val_f1_score=0.931]
Epoch 154:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.0186, v_num=1, train_loss=0.115, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.352, val_accuracy=0.931, val_f1_score=0.931]
Epoch 154:  92%|█████████▏| 234/255 [01:31<00:08,  2.56it/s, loss=0.0186, v_num=1, train_loss=0.115, trai

Epoch 154, global step 35029: val_loss was not in top 2


Epoch 155:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.0133, v_num=1, train_loss=0.00321, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.338, val_accuracy=0.938, val_f1_score=0.938] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 155:  89%|████████▉ | 228/255 [01:31<00:10,  2.50it/s, loss=0.0133, v_num=1, train_loss=0.00321, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.338, val_accuracy=0.938, val_f1_score=0.938]
Epoch 155:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.0133, v_num=1, train_loss=0.00321, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.338, val_accuracy=0.938, val_f1_score=0.938]
Epoch 155:  91%|█████████ | 232/255 [01:31<00:09,  2.53it/s, loss=0.0133, v_num=1, train_loss=0.00321, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.338, val_accuracy=0.938, val_f1_score=0.938]
Epoch 155:  92%|█████████▏| 234/255 [01:31<00:08,  2.55it/s, loss=0.0133, v_num=1, train_loss=0.003

Epoch 155, global step 35255: val_loss was not in top 2


Epoch 156:  89%|████████▊ | 226/255 [01:25<00:10,  2.66it/s, loss=0.015, v_num=1, train_loss=0.0175, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.361, val_accuracy=0.937, val_f1_score=0.937]    
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 156:  89%|████████▉ | 228/255 [01:30<00:10,  2.51it/s, loss=0.015, v_num=1, train_loss=0.0175, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.361, val_accuracy=0.937, val_f1_score=0.937]
Epoch 156:  90%|█████████ | 230/255 [01:31<00:09,  2.53it/s, loss=0.015, v_num=1, train_loss=0.0175, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.361, val_accuracy=0.937, val_f1_score=0.937]
Epoch 156:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.015, v_num=1, train_loss=0.0175, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.361, val_accuracy=0.937, val_f1_score=0.937]
Epoch 156:  92%|█████████▏| 234/255 [01:31<00:08,  2.56it/s, loss=0.015, v_num=1, train_loss=0.0175, tra

Epoch 156, global step 35481: val_loss was not in top 2


Epoch 157:  89%|████████▊ | 226/255 [01:24<00:10,  2.66it/s, loss=0.0165, v_num=1, train_loss=0.0024, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.348, val_accuracy=0.938, val_f1_score=0.938]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 157:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.0165, v_num=1, train_loss=0.0024, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.348, val_accuracy=0.938, val_f1_score=0.938]
Epoch 157:  90%|█████████ | 230/255 [01:30<00:09,  2.53it/s, loss=0.0165, v_num=1, train_loss=0.0024, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.348, val_accuracy=0.938, val_f1_score=0.938]
Epoch 157:  91%|█████████ | 232/255 [01:30<00:09,  2.55it/s, loss=0.0165, v_num=1, train_loss=0.0024, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.348, val_accuracy=0.938, val_f1_score=0.938]
Epoch 157:  92%|█████████▏| 234/255 [01:31<00:08,  2.57it/s, loss=0.0165, v_num=1, train_loss=0.0024, 

Epoch 157, global step 35707: val_loss was not in top 2


Epoch 158:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.00963, v_num=1, train_loss=0.00013, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.328, val_accuracy=0.941, val_f1_score=0.941] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 158:  89%|████████▉ | 228/255 [01:31<00:10,  2.50it/s, loss=0.00963, v_num=1, train_loss=0.00013, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.328, val_accuracy=0.941, val_f1_score=0.941]
Epoch 158:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.00963, v_num=1, train_loss=0.00013, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.328, val_accuracy=0.941, val_f1_score=0.941]
Epoch 158:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.00963, v_num=1, train_loss=0.00013, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.328, val_accuracy=0.941, val_f1_score=0.941]
Epoch 158:  92%|█████████▏| 234/255 [01:31<00:08,  2.56it/s, loss=0.00963, v_num=1, train_loss=

Epoch 158, global step 35933: val_loss was not in top 2


Epoch 159:  89%|████████▊ | 226/255 [01:24<00:10,  2.66it/s, loss=0.00361, v_num=1, train_loss=0.00734, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.348, val_accuracy=0.936, val_f1_score=0.936] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 159:  89%|████████▉ | 228/255 [01:30<00:10,  2.51it/s, loss=0.00361, v_num=1, train_loss=0.00734, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.348, val_accuracy=0.936, val_f1_score=0.936]
Epoch 159:  90%|█████████ | 230/255 [01:30<00:09,  2.53it/s, loss=0.00361, v_num=1, train_loss=0.00734, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.348, val_accuracy=0.936, val_f1_score=0.936]
Epoch 159:  91%|█████████ | 232/255 [01:31<00:09,  2.55it/s, loss=0.00361, v_num=1, train_loss=0.00734, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.348, val_accuracy=0.936, val_f1_score=0.936]
Epoch 159:  92%|█████████▏| 234/255 [01:31<00:08,  2.56it/s, loss=0.00361, v_num=1, train_loss=

Epoch 159, global step 36159: val_loss was not in top 2


Epoch 160:  89%|████████▊ | 226/255 [01:25<00:10,  2.66it/s, loss=0.033, v_num=1, train_loss=0.0181, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.360, val_accuracy=0.944, val_f1_score=0.944]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 160:  89%|████████▉ | 228/255 [01:30<00:10,  2.51it/s, loss=0.033, v_num=1, train_loss=0.0181, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.360, val_accuracy=0.944, val_f1_score=0.944]
Validating:   7%|▋         | 2/29 [00:05<01:06,  2.44s/it][A
Epoch 160:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.033, v_num=1, train_loss=0.0181, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.360, val_accuracy=0.944, val_f1_score=0.944]
Epoch 160:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.033, v_num=1, train_loss=0.0181, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.360, val_accuracy=0.944, val_f1_score=0.944]
Epoch 160:  92%|█████████▏| 234/255 [01:31<

Epoch 160, global step 36385: val_loss was not in top 2


Epoch 161:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.0162, v_num=1, train_loss=0.000602, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.355, val_accuracy=0.933, val_f1_score=0.933]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 161:  89%|████████▉ | 228/255 [01:31<00:10,  2.50it/s, loss=0.0162, v_num=1, train_loss=0.000602, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.355, val_accuracy=0.933, val_f1_score=0.933]
Epoch 161:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.0162, v_num=1, train_loss=0.000602, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.355, val_accuracy=0.933, val_f1_score=0.933]
Epoch 161:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.0162, v_num=1, train_loss=0.000602, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.355, val_accuracy=0.933, val_f1_score=0.933]
Epoch 161:  92%|█████████▏| 234/255 [01:31<00:08,  2.55it/s, loss=0.0162, v_num=1, train_loss=0.

Epoch 161, global step 36611: val_loss was not in top 2


Epoch 162:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.0142, v_num=1, train_loss=0.0268, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.360, val_accuracy=0.928, val_f1_score=0.928]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 162:  89%|████████▉ | 228/255 [01:31<00:10,  2.50it/s, loss=0.0142, v_num=1, train_loss=0.0268, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.360, val_accuracy=0.928, val_f1_score=0.928]
Epoch 162:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.0142, v_num=1, train_loss=0.0268, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.360, val_accuracy=0.928, val_f1_score=0.928]
Epoch 162:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.0142, v_num=1, train_loss=0.0268, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.360, val_accuracy=0.928, val_f1_score=0.928]
Epoch 162:  92%|█████████▏| 234/255 [01:31<00:08,  2.56it/s, loss=0.0142, v_num=1, train_loss=0.0268, 

Epoch 162, global step 36837: val_loss was not in top 2


Epoch 163:  89%|████████▊ | 226/255 [01:26<00:11,  2.62it/s, loss=0.00987, v_num=1, train_loss=0.000212, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.338, val_accuracy=0.928, val_f1_score=0.928]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 163:  89%|████████▉ | 228/255 [01:31<00:10,  2.48it/s, loss=0.00987, v_num=1, train_loss=0.000212, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.338, val_accuracy=0.928, val_f1_score=0.928]
Epoch 163:  90%|█████████ | 230/255 [01:32<00:10,  2.50it/s, loss=0.00987, v_num=1, train_loss=0.000212, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.338, val_accuracy=0.928, val_f1_score=0.928]
Epoch 163:  91%|█████████ | 232/255 [01:32<00:09,  2.51it/s, loss=0.00987, v_num=1, train_loss=0.000212, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.338, val_accuracy=0.928, val_f1_score=0.928]
Epoch 163:  92%|█████████▏| 234/255 [01:32<00:08,  2.53it/s, loss=0.00987, v_num=1, train_lo

Epoch 163, global step 37063: val_loss was not in top 2


Epoch 164:  89%|████████▊ | 226/255 [01:25<00:10,  2.64it/s, loss=0.11, v_num=1, train_loss=0.0465, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.340, val_accuracy=0.929, val_f1_score=0.929]     
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 164:  89%|████████▉ | 228/255 [01:31<00:10,  2.49it/s, loss=0.11, v_num=1, train_loss=0.0465, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.340, val_accuracy=0.929, val_f1_score=0.929]
Epoch 164:  90%|█████████ | 230/255 [01:31<00:09,  2.51it/s, loss=0.11, v_num=1, train_loss=0.0465, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.340, val_accuracy=0.929, val_f1_score=0.929]
Epoch 164:  91%|█████████ | 232/255 [01:31<00:09,  2.53it/s, loss=0.11, v_num=1, train_loss=0.0465, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.340, val_accuracy=0.929, val_f1_score=0.929]
Epoch 164:  92%|█████████▏| 234/255 [01:31<00:08,  2.54it/s, loss=0.11, v_num=1, train_loss=0.0465, train_a

Epoch 164, global step 37289: val_loss was not in top 2


Epoch 165:  89%|████████▊ | 226/255 [01:25<00:10,  2.64it/s, loss=0.0139, v_num=1, train_loss=0.00558, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.320, val_accuracy=0.915, val_f1_score=0.915]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 165:  89%|████████▉ | 228/255 [01:31<00:10,  2.49it/s, loss=0.0139, v_num=1, train_loss=0.00558, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.320, val_accuracy=0.915, val_f1_score=0.915]
Epoch 165:  90%|█████████ | 230/255 [01:31<00:09,  2.51it/s, loss=0.0139, v_num=1, train_loss=0.00558, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.320, val_accuracy=0.915, val_f1_score=0.915]
Epoch 165:  91%|█████████ | 232/255 [01:31<00:09,  2.52it/s, loss=0.0139, v_num=1, train_loss=0.00558, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.320, val_accuracy=0.915, val_f1_score=0.915]
Epoch 165:  92%|█████████▏| 234/255 [01:32<00:08,  2.54it/s, loss=0.0139, v_num=1, train_loss=0.0055

Epoch 165, global step 37515: val_loss was not in top 2


Epoch 166:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.00811, v_num=1, train_loss=0.0012, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.290, val_accuracy=0.933, val_f1_score=0.933]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 166:  89%|████████▉ | 228/255 [01:31<00:10,  2.50it/s, loss=0.00811, v_num=1, train_loss=0.0012, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.290, val_accuracy=0.933, val_f1_score=0.933]
Epoch 166:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.00811, v_num=1, train_loss=0.0012, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.290, val_accuracy=0.933, val_f1_score=0.933]
Epoch 166:  91%|█████████ | 232/255 [01:31<00:09,  2.53it/s, loss=0.00811, v_num=1, train_loss=0.0012, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.290, val_accuracy=0.933, val_f1_score=0.933]
Epoch 166:  92%|█████████▏| 234/255 [01:31<00:08,  2.55it/s, loss=0.00811, v_num=1, train_loss=0.0

Epoch 166, global step 37741: val_loss was not in top 2


Epoch 167:  89%|████████▊ | 226/255 [01:25<00:10,  2.66it/s, loss=0.021, v_num=1, train_loss=0.0015, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.329, val_accuracy=0.933, val_f1_score=0.933]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 167:  89%|████████▉ | 228/255 [01:30<00:10,  2.51it/s, loss=0.021, v_num=1, train_loss=0.0015, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.329, val_accuracy=0.933, val_f1_score=0.933]
Epoch 167:  90%|█████████ | 230/255 [01:31<00:09,  2.53it/s, loss=0.021, v_num=1, train_loss=0.0015, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.329, val_accuracy=0.933, val_f1_score=0.933]
Epoch 167:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.021, v_num=1, train_loss=0.0015, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.329, val_accuracy=0.933, val_f1_score=0.933]
Epoch 167:  92%|█████████▏| 234/255 [01:31<00:08,  2.56it/s, loss=0.021, v_num=1, train_loss=0.0015, trai

Epoch 167, global step 37967: val_loss was not in top 2


Epoch 168:  89%|████████▊ | 226/255 [01:25<00:10,  2.66it/s, loss=0.0489, v_num=1, train_loss=0.00298, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.340, val_accuracy=0.933, val_f1_score=0.933]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 168:  89%|████████▉ | 228/255 [01:30<00:10,  2.51it/s, loss=0.0489, v_num=1, train_loss=0.00298, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.340, val_accuracy=0.933, val_f1_score=0.933]
Validating:   7%|▋         | 2/29 [00:05<01:05,  2.43s/it][A
Epoch 168:  90%|█████████ | 230/255 [01:30<00:09,  2.53it/s, loss=0.0489, v_num=1, train_loss=0.00298, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.340, val_accuracy=0.933, val_f1_score=0.933]
Epoch 168:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.0489, v_num=1, train_loss=0.00298, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.340, val_accuracy=0.933, val_f1_score=0.933]
Epoch 168:  92%|█████████▏| 234/255 

Epoch 168, global step 38193: val_loss was not in top 2


Epoch 169:  89%|████████▊ | 226/255 [01:25<00:11,  2.63it/s, loss=0.0208, v_num=1, train_loss=0.00331, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.355, val_accuracy=0.930, val_f1_score=0.930] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 169:  89%|████████▉ | 228/255 [01:31<00:10,  2.49it/s, loss=0.0208, v_num=1, train_loss=0.00331, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.355, val_accuracy=0.930, val_f1_score=0.930]
Epoch 169:  90%|█████████ | 230/255 [01:31<00:09,  2.50it/s, loss=0.0208, v_num=1, train_loss=0.00331, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.355, val_accuracy=0.930, val_f1_score=0.930]
Epoch 169:  91%|█████████ | 232/255 [01:32<00:09,  2.52it/s, loss=0.0208, v_num=1, train_loss=0.00331, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.355, val_accuracy=0.930, val_f1_score=0.930]
Epoch 169:  92%|█████████▏| 234/255 [01:32<00:08,  2.54it/s, loss=0.0208, v_num=1, train_loss=0.003

Epoch 169, global step 38419: val_loss was not in top 2


Epoch 170:  89%|████████▊ | 226/255 [01:25<00:10,  2.64it/s, loss=0.0157, v_num=1, train_loss=0.0397, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.331, val_accuracy=0.938, val_f1_score=0.938] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 170:  89%|████████▉ | 228/255 [01:31<00:10,  2.50it/s, loss=0.0157, v_num=1, train_loss=0.0397, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.331, val_accuracy=0.938, val_f1_score=0.938]
Epoch 170:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.0157, v_num=1, train_loss=0.0397, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.331, val_accuracy=0.938, val_f1_score=0.938]
Epoch 170:  91%|█████████ | 232/255 [01:31<00:09,  2.53it/s, loss=0.0157, v_num=1, train_loss=0.0397, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.331, val_accuracy=0.938, val_f1_score=0.938]
Epoch 170:  92%|█████████▏| 234/255 [01:31<00:08,  2.55it/s, loss=0.0157, v_num=1, train_loss=0.0397, t

Epoch 170, global step 38645: val_loss was not in top 2


Epoch 171:  89%|████████▊ | 226/255 [01:24<00:10,  2.66it/s, loss=0.00951, v_num=1, train_loss=0.00465, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.297, val_accuracy=0.935, val_f1_score=0.935] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 171:  89%|████████▉ | 228/255 [01:30<00:10,  2.51it/s, loss=0.00951, v_num=1, train_loss=0.00465, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.297, val_accuracy=0.935, val_f1_score=0.935]
Epoch 171:  90%|█████████ | 230/255 [01:30<00:09,  2.53it/s, loss=0.00951, v_num=1, train_loss=0.00465, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.297, val_accuracy=0.935, val_f1_score=0.935]
Epoch 171:  91%|█████████ | 232/255 [01:31<00:09,  2.55it/s, loss=0.00951, v_num=1, train_loss=0.00465, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.297, val_accuracy=0.935, val_f1_score=0.935]
Epoch 171:  92%|█████████▏| 234/255 [01:31<00:08,  2.56it/s, loss=0.00951, v_num=1, train_loss=

Epoch 171, global step 38871: val_loss was not in top 2


Epoch 172:  89%|████████▊ | 226/255 [01:24<00:10,  2.66it/s, loss=0.0171, v_num=1, train_loss=0.004, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.287, val_accuracy=0.940, val_f1_score=0.940]    
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 172:  89%|████████▉ | 228/255 [01:30<00:10,  2.51it/s, loss=0.0171, v_num=1, train_loss=0.004, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.287, val_accuracy=0.940, val_f1_score=0.940]
Epoch 172:  90%|█████████ | 230/255 [01:31<00:09,  2.53it/s, loss=0.0171, v_num=1, train_loss=0.004, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.287, val_accuracy=0.940, val_f1_score=0.940]
Epoch 172:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.0171, v_num=1, train_loss=0.004, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.287, val_accuracy=0.940, val_f1_score=0.940]
Epoch 172:  92%|█████████▏| 234/255 [01:31<00:08,  2.56it/s, loss=0.0171, v_num=1, train_loss=0.004, tra

Epoch 172, global step 39097: val_loss was not in top 2


Epoch 173:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.00799, v_num=1, train_loss=0.00189, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.343, val_accuracy=0.932, val_f1_score=0.932] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 173:  89%|████████▉ | 228/255 [01:31<00:10,  2.50it/s, loss=0.00799, v_num=1, train_loss=0.00189, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.343, val_accuracy=0.932, val_f1_score=0.932]
Epoch 173:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.00799, v_num=1, train_loss=0.00189, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.343, val_accuracy=0.932, val_f1_score=0.932]
Epoch 173:  91%|█████████ | 232/255 [01:31<00:09,  2.53it/s, loss=0.00799, v_num=1, train_loss=0.00189, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.343, val_accuracy=0.932, val_f1_score=0.932]
Epoch 173:  92%|█████████▏| 234/255 [01:31<00:08,  2.55it/s, loss=0.00799, v_num=1, train_loss=

Epoch 173, global step 39323: val_loss was not in top 2


Epoch 174:  89%|████████▊ | 226/255 [01:24<00:10,  2.66it/s, loss=0.0127, v_num=1, train_loss=0.00047, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.293, val_accuracy=0.943, val_f1_score=0.943]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 174:  89%|████████▉ | 228/255 [01:30<00:10,  2.51it/s, loss=0.0127, v_num=1, train_loss=0.00047, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.293, val_accuracy=0.943, val_f1_score=0.943]
Epoch 174:  90%|█████████ | 230/255 [01:30<00:09,  2.53it/s, loss=0.0127, v_num=1, train_loss=0.00047, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.293, val_accuracy=0.943, val_f1_score=0.943]
Epoch 174:  91%|█████████ | 232/255 [01:31<00:09,  2.55it/s, loss=0.0127, v_num=1, train_loss=0.00047, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.293, val_accuracy=0.943, val_f1_score=0.943]
Epoch 174:  92%|█████████▏| 234/255 [01:31<00:08,  2.57it/s, loss=0.0127, v_num=1, train_loss=0.00

Epoch 174, global step 39549: val_loss was not in top 2


Epoch 175:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.00457, v_num=1, train_loss=0.000308, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.321, val_accuracy=0.940, val_f1_score=0.940]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 175:  89%|████████▉ | 228/255 [01:31<00:10,  2.50it/s, loss=0.00457, v_num=1, train_loss=0.000308, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.321, val_accuracy=0.940, val_f1_score=0.940]
Epoch 175:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.00457, v_num=1, train_loss=0.000308, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.321, val_accuracy=0.940, val_f1_score=0.940]
Epoch 175:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.00457, v_num=1, train_loss=0.000308, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.321, val_accuracy=0.940, val_f1_score=0.940]
Epoch 175:  92%|█████████▏| 234/255 [01:31<00:08,  2.55it/s, loss=0.00457, v_num=1, train_lo

Epoch 175, global step 39775: val_loss was not in top 2


Epoch 176:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.0115, v_num=1, train_loss=0.0566, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.303, val_accuracy=0.942, val_f1_score=0.942]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 176:  89%|████████▉ | 228/255 [01:31<00:10,  2.50it/s, loss=0.0115, v_num=1, train_loss=0.0566, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.303, val_accuracy=0.942, val_f1_score=0.942]
Epoch 176:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.0115, v_num=1, train_loss=0.0566, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.303, val_accuracy=0.942, val_f1_score=0.942]
Epoch 176:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.0115, v_num=1, train_loss=0.0566, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.303, val_accuracy=0.942, val_f1_score=0.942]
Epoch 176:  92%|█████████▏| 234/255 [01:31<00:08,  2.55it/s, loss=0.0115, v_num=1, train_loss=0.0566,

Epoch 176, global step 40001: val_loss was not in top 2


Epoch 177:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.0153, v_num=1, train_loss=0.00133, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.344, val_accuracy=0.937, val_f1_score=0.937]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 177:  89%|████████▉ | 228/255 [01:31<00:10,  2.50it/s, loss=0.0153, v_num=1, train_loss=0.00133, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.344, val_accuracy=0.937, val_f1_score=0.937]
Epoch 177:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.0153, v_num=1, train_loss=0.00133, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.344, val_accuracy=0.937, val_f1_score=0.937]
Epoch 177:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.0153, v_num=1, train_loss=0.00133, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.344, val_accuracy=0.937, val_f1_score=0.937]
Epoch 177:  92%|█████████▏| 234/255 [01:31<00:08,  2.55it/s, loss=0.0153, v_num=1, train_loss=0.00

Epoch 177, global step 40227: val_loss was not in top 2


Epoch 178:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.0447, v_num=1, train_loss=0.000694, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.350, val_accuracy=0.939, val_f1_score=0.939] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 178:  89%|████████▉ | 228/255 [01:31<00:10,  2.50it/s, loss=0.0447, v_num=1, train_loss=0.000694, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.350, val_accuracy=0.939, val_f1_score=0.939]
Epoch 178:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.0447, v_num=1, train_loss=0.000694, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.350, val_accuracy=0.939, val_f1_score=0.939]
Epoch 178:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.0447, v_num=1, train_loss=0.000694, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.350, val_accuracy=0.939, val_f1_score=0.939]
Epoch 178:  92%|█████████▏| 234/255 [01:31<00:08,  2.55it/s, loss=0.0447, v_num=1, train_loss=0

Epoch 178, global step 40453: val_loss was not in top 2


Epoch 179:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.0285, v_num=1, train_loss=0.00194, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.319, val_accuracy=0.928, val_f1_score=0.928] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 179:  89%|████████▉ | 228/255 [01:31<00:10,  2.50it/s, loss=0.0285, v_num=1, train_loss=0.00194, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.319, val_accuracy=0.928, val_f1_score=0.928]
Epoch 179:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.0285, v_num=1, train_loss=0.00194, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.319, val_accuracy=0.928, val_f1_score=0.928]
Epoch 179:  91%|█████████ | 232/255 [01:31<00:09,  2.53it/s, loss=0.0285, v_num=1, train_loss=0.00194, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.319, val_accuracy=0.928, val_f1_score=0.928]
Epoch 179:  92%|█████████▏| 234/255 [01:31<00:08,  2.55it/s, loss=0.0285, v_num=1, train_loss=0.001

Epoch 179, global step 40679: val_loss was not in top 2


Epoch 180:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.00589, v_num=1, train_loss=0.00122, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.300, val_accuracy=0.936, val_f1_score=0.936]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 180:  89%|████████▉ | 228/255 [01:31<00:10,  2.50it/s, loss=0.00589, v_num=1, train_loss=0.00122, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.300, val_accuracy=0.936, val_f1_score=0.936]
Epoch 180:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.00589, v_num=1, train_loss=0.00122, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.300, val_accuracy=0.936, val_f1_score=0.936]
Epoch 180:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.00589, v_num=1, train_loss=0.00122, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.300, val_accuracy=0.936, val_f1_score=0.936]
Epoch 180:  92%|█████████▏| 234/255 [01:31<00:08,  2.55it/s, loss=0.00589, v_num=1, train_loss=0

Epoch 180, global step 40905: val_loss reached 0.25943 (best 0.25943), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v3.ckpt" as top 2


Epoch 181:  89%|████████▊ | 226/255 [01:25<00:10,  2.64it/s, loss=0.0104, v_num=1, train_loss=0.00192, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.259, val_accuracy=0.948, val_f1_score=0.948]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 181:  89%|████████▉ | 228/255 [01:31<00:10,  2.49it/s, loss=0.0104, v_num=1, train_loss=0.00192, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.259, val_accuracy=0.948, val_f1_score=0.948]
Epoch 181:  90%|█████████ | 230/255 [01:31<00:09,  2.51it/s, loss=0.0104, v_num=1, train_loss=0.00192, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.259, val_accuracy=0.948, val_f1_score=0.948]
Epoch 181:  91%|█████████ | 232/255 [01:31<00:09,  2.53it/s, loss=0.0104, v_num=1, train_loss=0.00192, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.259, val_accuracy=0.948, val_f1_score=0.948]
Epoch 181:  92%|█████████▏| 234/255 [01:31<00:08,  2.54it/s, loss=0.0104, v_num=1, train_loss=0.00

Epoch 181, global step 41131: val_loss reached 0.25566 (best 0.25566), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v2.ckpt" as top 2


Epoch 182:  89%|████████▊ | 226/255 [01:25<00:11,  2.64it/s, loss=0.0382, v_num=1, train_loss=0.00501, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.256, val_accuracy=0.948, val_f1_score=0.948]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 182:  89%|████████▉ | 228/255 [01:31<00:10,  2.48it/s, loss=0.0382, v_num=1, train_loss=0.00501, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.256, val_accuracy=0.948, val_f1_score=0.948]
Epoch 182:  90%|█████████ | 230/255 [01:32<00:10,  2.50it/s, loss=0.0382, v_num=1, train_loss=0.00501, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.256, val_accuracy=0.948, val_f1_score=0.948]
Epoch 182:  91%|█████████ | 232/255 [01:32<00:09,  2.52it/s, loss=0.0382, v_num=1, train_loss=0.00501, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.256, val_accuracy=0.948, val_f1_score=0.948]
Epoch 182:  92%|█████████▏| 234/255 [01:32<00:08,  2.53it/s, loss=0.0382, v_num=1, train_loss=0.00

Epoch 182, global step 41357: val_loss was not in top 2


Epoch 183:  89%|████████▊ | 226/255 [01:25<00:11,  2.63it/s, loss=0.0276, v_num=1, train_loss=0.311, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.317, val_accuracy=0.939, val_f1_score=0.939]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 183:  89%|████████▉ | 228/255 [01:31<00:10,  2.48it/s, loss=0.0276, v_num=1, train_loss=0.311, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.317, val_accuracy=0.939, val_f1_score=0.939]
Epoch 183:  90%|█████████ | 230/255 [01:32<00:10,  2.50it/s, loss=0.0276, v_num=1, train_loss=0.311, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.317, val_accuracy=0.939, val_f1_score=0.939]
Epoch 183:  91%|█████████ | 232/255 [01:32<00:09,  2.52it/s, loss=0.0276, v_num=1, train_loss=0.311, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.317, val_accuracy=0.939, val_f1_score=0.939]
Epoch 183:  92%|█████████▏| 234/255 [01:32<00:08,  2.53it/s, loss=0.0276, v_num=1, train_loss=0.311, train

Epoch 183, global step 41583: val_loss reached 0.21615 (best 0.21615), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v3.ckpt" as top 2


Epoch 184:  89%|████████▊ | 226/255 [01:25<00:10,  2.64it/s, loss=0.0123, v_num=1, train_loss=0.000905, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.216, val_accuracy=0.948, val_f1_score=0.948]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 184:  89%|████████▉ | 228/255 [01:31<00:10,  2.49it/s, loss=0.0123, v_num=1, train_loss=0.000905, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.216, val_accuracy=0.948, val_f1_score=0.948]
Epoch 184:  90%|█████████ | 230/255 [01:31<00:09,  2.51it/s, loss=0.0123, v_num=1, train_loss=0.000905, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.216, val_accuracy=0.948, val_f1_score=0.948]
Epoch 184:  91%|█████████ | 232/255 [01:31<00:09,  2.53it/s, loss=0.0123, v_num=1, train_loss=0.000905, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.216, val_accuracy=0.948, val_f1_score=0.948]
Epoch 184:  92%|█████████▏| 234/255 [01:31<00:08,  2.54it/s, loss=0.0123, v_num=1, train_loss=0.

Epoch 184, global step 41809: val_loss reached 0.23878 (best 0.21615), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-1-v2.ckpt" as top 2


Epoch 185:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.00436, v_num=1, train_loss=0.00169, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.239, val_accuracy=0.945, val_f1_score=0.945] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 185:  89%|████████▉ | 228/255 [01:31<00:10,  2.50it/s, loss=0.00436, v_num=1, train_loss=0.00169, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.239, val_accuracy=0.945, val_f1_score=0.945]
Epoch 185:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.00436, v_num=1, train_loss=0.00169, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.239, val_accuracy=0.945, val_f1_score=0.945]
Epoch 185:  91%|█████████ | 232/255 [01:31<00:09,  2.53it/s, loss=0.00436, v_num=1, train_loss=0.00169, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.239, val_accuracy=0.945, val_f1_score=0.945]
Epoch 185:  92%|█████████▏| 234/255 [01:31<00:08,  2.55it/s, loss=0.00436, v_num=1, train_loss=

Epoch 185, global step 42035: val_loss was not in top 2


Epoch 186:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.0338, v_num=1, train_loss=0.00232, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.271, val_accuracy=0.942, val_f1_score=0.942]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 186:  89%|████████▉ | 228/255 [01:31<00:10,  2.50it/s, loss=0.0338, v_num=1, train_loss=0.00232, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.271, val_accuracy=0.942, val_f1_score=0.942]
Epoch 186:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.0338, v_num=1, train_loss=0.00232, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.271, val_accuracy=0.942, val_f1_score=0.942]
Epoch 186:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.0338, v_num=1, train_loss=0.00232, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.271, val_accuracy=0.942, val_f1_score=0.942]
Epoch 186:  92%|█████████▏| 234/255 [01:31<00:08,  2.55it/s, loss=0.0338, v_num=1, train_loss=0.00

Epoch 186, global step 42261: val_loss was not in top 2


Epoch 187:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.0111, v_num=1, train_loss=0.000829, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.297, val_accuracy=0.938, val_f1_score=0.938]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 187:  89%|████████▉ | 228/255 [01:30<00:10,  2.51it/s, loss=0.0111, v_num=1, train_loss=0.000829, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.297, val_accuracy=0.938, val_f1_score=0.938]
Epoch 187:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.0111, v_num=1, train_loss=0.000829, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.297, val_accuracy=0.938, val_f1_score=0.938]
Epoch 187:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.0111, v_num=1, train_loss=0.000829, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.297, val_accuracy=0.938, val_f1_score=0.938]
Epoch 187:  92%|█████████▏| 234/255 [01:31<00:08,  2.56it/s, loss=0.0111, v_num=1, train_loss=0.

Epoch 187, global step 42487: val_loss was not in top 2


Epoch 188:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.0626, v_num=1, train_loss=0.00652, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.255, val_accuracy=0.945, val_f1_score=0.945]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 188:  89%|████████▉ | 228/255 [01:31<00:10,  2.50it/s, loss=0.0626, v_num=1, train_loss=0.00652, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.255, val_accuracy=0.945, val_f1_score=0.945]
Epoch 188:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.0626, v_num=1, train_loss=0.00652, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.255, val_accuracy=0.945, val_f1_score=0.945]
Epoch 188:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.0626, v_num=1, train_loss=0.00652, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.255, val_accuracy=0.945, val_f1_score=0.945]
Epoch 188:  92%|█████████▏| 234/255 [01:31<00:08,  2.55it/s, loss=0.0626, v_num=1, train_loss=0.00

Epoch 188, global step 42713: val_loss was not in top 2


Epoch 189:  89%|████████▊ | 226/255 [01:24<00:10,  2.66it/s, loss=0.0127, v_num=1, train_loss=0.00599, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.258, val_accuracy=0.929, val_f1_score=0.929]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 189:  89%|████████▉ | 228/255 [01:30<00:10,  2.51it/s, loss=0.0127, v_num=1, train_loss=0.00599, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.258, val_accuracy=0.929, val_f1_score=0.929]
Epoch 189:  90%|█████████ | 230/255 [01:30<00:09,  2.53it/s, loss=0.0127, v_num=1, train_loss=0.00599, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.258, val_accuracy=0.929, val_f1_score=0.929]
Epoch 189:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.0127, v_num=1, train_loss=0.00599, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.258, val_accuracy=0.929, val_f1_score=0.929]
Epoch 189:  92%|█████████▏| 234/255 [01:31<00:08,  2.56it/s, loss=0.0127, v_num=1, train_loss=0.0059

Epoch 189, global step 42939: val_loss was not in top 2


Epoch 190:  89%|████████▊ | 226/255 [01:24<00:10,  2.66it/s, loss=0.0029, v_num=1, train_loss=0.00569, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.254, val_accuracy=0.943, val_f1_score=0.943]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 190:  89%|████████▉ | 228/255 [01:30<00:10,  2.51it/s, loss=0.0029, v_num=1, train_loss=0.00569, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.254, val_accuracy=0.943, val_f1_score=0.943]
Epoch 190:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.0029, v_num=1, train_loss=0.00569, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.254, val_accuracy=0.943, val_f1_score=0.943]
Epoch 190:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.0029, v_num=1, train_loss=0.00569, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.254, val_accuracy=0.943, val_f1_score=0.943]
Epoch 190:  92%|█████████▏| 234/255 [01:31<00:08,  2.56it/s, loss=0.0029, v_num=1, train_loss=0.00

Epoch 190, global step 43165: val_loss was not in top 2


Epoch 191:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.0116, v_num=1, train_loss=0.000572, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.249, val_accuracy=0.945, val_f1_score=0.945] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 191:  89%|████████▉ | 228/255 [01:31<00:10,  2.50it/s, loss=0.0116, v_num=1, train_loss=0.000572, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.249, val_accuracy=0.945, val_f1_score=0.945]
Epoch 191:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.0116, v_num=1, train_loss=0.000572, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.249, val_accuracy=0.945, val_f1_score=0.945]
Epoch 191:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.0116, v_num=1, train_loss=0.000572, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.249, val_accuracy=0.945, val_f1_score=0.945]
Epoch 191:  92%|█████████▏| 234/255 [01:31<00:08,  2.56it/s, loss=0.0116, v_num=1, train_loss=0

Epoch 191, global step 43391: val_loss was not in top 2


Epoch 192:  89%|████████▊ | 226/255 [01:25<00:10,  2.66it/s, loss=0.00903, v_num=1, train_loss=0.00886, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.938, val_f1_score=0.938] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 192:  89%|████████▉ | 228/255 [01:30<00:10,  2.51it/s, loss=0.00903, v_num=1, train_loss=0.00886, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.938, val_f1_score=0.938]
Epoch 192:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.00903, v_num=1, train_loss=0.00886, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.938, val_f1_score=0.938]
Epoch 192:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.00903, v_num=1, train_loss=0.00886, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.938, val_f1_score=0.938]
Epoch 192:  92%|█████████▏| 234/255 [01:31<00:08,  2.56it/s, loss=0.00903, v_num=1, train_loss=

Epoch 192, global step 43617: val_loss was not in top 2


Epoch 193:  89%|████████▊ | 226/255 [01:25<00:10,  2.66it/s, loss=0.0158, v_num=1, train_loss=0.000753, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.294, val_accuracy=0.940, val_f1_score=0.940] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 193:  89%|████████▉ | 228/255 [01:31<00:10,  2.50it/s, loss=0.0158, v_num=1, train_loss=0.000753, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.294, val_accuracy=0.940, val_f1_score=0.940]
Epoch 193:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.0158, v_num=1, train_loss=0.000753, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.294, val_accuracy=0.940, val_f1_score=0.940]
Epoch 193:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.0158, v_num=1, train_loss=0.000753, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.294, val_accuracy=0.940, val_f1_score=0.940]
Epoch 193:  92%|█████████▏| 234/255 [01:31<00:08,  2.55it/s, loss=0.0158, v_num=1, train_loss=0

Epoch 193, global step 43843: val_loss was not in top 2


Epoch 194:  89%|████████▊ | 226/255 [01:25<00:10,  2.64it/s, loss=0.0186, v_num=1, train_loss=0.00741, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.282, val_accuracy=0.941, val_f1_score=0.941]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 194:  89%|████████▉ | 228/255 [01:31<00:10,  2.49it/s, loss=0.0186, v_num=1, train_loss=0.00741, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.282, val_accuracy=0.941, val_f1_score=0.941]
Epoch 194:  90%|█████████ | 230/255 [01:31<00:09,  2.51it/s, loss=0.0186, v_num=1, train_loss=0.00741, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.282, val_accuracy=0.941, val_f1_score=0.941]
Epoch 194:  91%|█████████ | 232/255 [01:31<00:09,  2.52it/s, loss=0.0186, v_num=1, train_loss=0.00741, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.282, val_accuracy=0.941, val_f1_score=0.941]
Epoch 194:  92%|█████████▏| 234/255 [01:32<00:08,  2.54it/s, loss=0.0186, v_num=1, train_loss=0.00

Epoch 194, global step 44069: val_loss was not in top 2


Epoch 195:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.00574, v_num=1, train_loss=0.00101, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.292, val_accuracy=0.938, val_f1_score=0.938] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 195:  89%|████████▉ | 228/255 [01:31<00:10,  2.49it/s, loss=0.00574, v_num=1, train_loss=0.00101, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.292, val_accuracy=0.938, val_f1_score=0.938]
Epoch 195:  90%|█████████ | 230/255 [01:31<00:09,  2.51it/s, loss=0.00574, v_num=1, train_loss=0.00101, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.292, val_accuracy=0.938, val_f1_score=0.938]
Epoch 195:  91%|█████████ | 232/255 [01:31<00:09,  2.52it/s, loss=0.00574, v_num=1, train_loss=0.00101, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.292, val_accuracy=0.938, val_f1_score=0.938]
Epoch 195:  92%|█████████▏| 234/255 [01:32<00:08,  2.54it/s, loss=0.00574, v_num=1, train_loss=

Epoch 195, global step 44295: val_loss was not in top 2


Epoch 196:  89%|████████▊ | 226/255 [01:25<00:10,  2.64it/s, loss=0.0133, v_num=1, train_loss=0.00123, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.275, val_accuracy=0.945, val_f1_score=0.945]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 196:  89%|████████▉ | 228/255 [01:31<00:10,  2.49it/s, loss=0.0133, v_num=1, train_loss=0.00123, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.275, val_accuracy=0.945, val_f1_score=0.945]
Epoch 196:  90%|█████████ | 230/255 [01:31<00:09,  2.51it/s, loss=0.0133, v_num=1, train_loss=0.00123, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.275, val_accuracy=0.945, val_f1_score=0.945]
Epoch 196:  91%|█████████ | 232/255 [01:31<00:09,  2.53it/s, loss=0.0133, v_num=1, train_loss=0.00123, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.275, val_accuracy=0.945, val_f1_score=0.945]
Epoch 196:  92%|█████████▏| 234/255 [01:31<00:08,  2.54it/s, loss=0.0133, v_num=1, train_loss=0.00

Epoch 196, global step 44521: val_loss was not in top 2


Epoch 197:  89%|████████▊ | 226/255 [01:24<00:10,  2.66it/s, loss=0.00274, v_num=1, train_loss=0.00024, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.297, val_accuracy=0.943, val_f1_score=0.943] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 197:  89%|████████▉ | 228/255 [01:30<00:10,  2.51it/s, loss=0.00274, v_num=1, train_loss=0.00024, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.297, val_accuracy=0.943, val_f1_score=0.943]
Epoch 197:  90%|█████████ | 230/255 [01:30<00:09,  2.53it/s, loss=0.00274, v_num=1, train_loss=0.00024, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.297, val_accuracy=0.943, val_f1_score=0.943]
Epoch 197:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.00274, v_num=1, train_loss=0.00024, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.297, val_accuracy=0.943, val_f1_score=0.943]
Epoch 197:  92%|█████████▏| 234/255 [01:31<00:08,  2.56it/s, loss=0.00274, v_num=1, train_loss=

Epoch 197, global step 44747: val_loss was not in top 2


Epoch 198:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.00761, v_num=1, train_loss=0.000316, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.282, val_accuracy=0.941, val_f1_score=0.941]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 198:  89%|████████▉ | 228/255 [01:31<00:10,  2.50it/s, loss=0.00761, v_num=1, train_loss=0.000316, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.282, val_accuracy=0.941, val_f1_score=0.941]
Epoch 198:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.00761, v_num=1, train_loss=0.000316, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.282, val_accuracy=0.941, val_f1_score=0.941]
Epoch 198:  91%|█████████ | 232/255 [01:31<00:09,  2.53it/s, loss=0.00761, v_num=1, train_loss=0.000316, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.282, val_accuracy=0.941, val_f1_score=0.941]
Epoch 198:  92%|█████████▏| 234/255 [01:31<00:08,  2.55it/s, loss=0.00761, v_num=1, train_lo

Epoch 198, global step 44973: val_loss was not in top 2


Epoch 199:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.00306, v_num=1, train_loss=0.000938, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.266, val_accuracy=0.947, val_f1_score=0.947]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 199:  89%|████████▉ | 228/255 [01:31<00:10,  2.50it/s, loss=0.00306, v_num=1, train_loss=0.000938, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.266, val_accuracy=0.947, val_f1_score=0.947]
Epoch 199:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.00306, v_num=1, train_loss=0.000938, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.266, val_accuracy=0.947, val_f1_score=0.947]
Epoch 199:  91%|█████████ | 232/255 [01:31<00:09,  2.53it/s, loss=0.00306, v_num=1, train_loss=0.000938, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.266, val_accuracy=0.947, val_f1_score=0.947]
Epoch 199:  92%|█████████▏| 234/255 [01:31<00:08,  2.55it/s, loss=0.00306, v_num=1, train_lo

Epoch 199, global step 45199: val_loss was not in top 2


Epoch 199: 100%|██████████| 255/255 [01:34<00:00,  2.70it/s, loss=0.00306, v_num=1, train_loss=0.000938, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.260, val_accuracy=0.942, val_f1_score=0.942]


LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1,2]


Testing: 100%|██████████| 29/29 [00:09<00:00,  4.52it/s]--------------------------------------------------------------------------------
DATALOADER:0 TEST RESULTS
{'test_f1_score': 0.943222165107727,
 'test_train_accuracy': 0.943222165107727,
 'test_train_loss': 0.24168267846107483}
--------------------------------------------------------------------------------
Testing: 100%|██████████| 29/29 [00:09<00:00,  3.19it/s]
------------------ Round: 2 ------------------
['FCZ', 'FT10', 'O2', 'O1', 'FT7', 'F4', 'TP7', 'C3', 'C4', 'F3', 'FT8', 'T6', 'HEOR', 'T5', 'VEOL', 'F7', 'FZ', 'VEOU', 'A1', 'P3', 'PZ', 'CP3', 'P4', 'CPZ', 'A2', 'HEOL', 'CP4', 'FT9', 'F8', 'OZ', 'CZ', 'FC4', 'FC3', 'FP1', 'PO1', 'T3', 'T4', 'PO2']
Len: 38


GPU available: True, used: True
TPU available: False, using: 0 TPU cores
IPU available: False, using: 0 IPUs
LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1,2]
Missing logger folder: lightning_logs/Drowsy_2

  | Name      | Type             | Params
-----------------------------------------------
0 | model     | DrowsyModel      | 1.4 M 
1 | criterion | CrossEntropyLoss | 0     
-----------------------------------------------
1.4 M     Trainable params
0         Non-trainable params
1.4 M     Total params
5.425     Total estimated model params size (MB)


                                                                      

Global seed set to 42


Epoch 0:  89%|████████▊ | 226/255 [01:23<00:10,  2.69it/s, loss=0.61, v_num=0, train_loss=0.572, train_accuracy=0.778, train_f1_score=0.778] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 0:  89%|████████▉ | 228/255 [01:29<00:10,  2.54it/s, loss=0.61, v_num=0, train_loss=0.572, train_accuracy=0.778, train_f1_score=0.778]
Epoch 0:  90%|█████████ | 230/255 [01:29<00:09,  2.56it/s, loss=0.61, v_num=0, train_loss=0.572, train_accuracy=0.778, train_f1_score=0.778]
Epoch 0:  91%|█████████ | 232/255 [01:30<00:08,  2.58it/s, loss=0.61, v_num=0, train_loss=0.572, train_accuracy=0.778, train_f1_score=0.778]
Epoch 0:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.61, v_num=0, train_loss=0.572, train_accuracy=0.778, train_f1_score=0.778]
Epoch 0:  93%|█████████▎| 236/255 [01:30<00:07,  2.61it/s, loss=0.61, v_num=0, train_loss=0.572, train_accuracy=0.778, train_f1_score=0.778]
Epoch 0:  93%|█████████▎| 238/255 [01:30<00:06,  2.63it/s, loss=0

Epoch 0, global step 225: val_loss reached 0.66079 (best 0.66079), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2.ckpt" as top 2


Epoch 1:  89%|████████▊ | 226/255 [01:23<00:10,  2.70it/s, loss=0.526, v_num=0, train_loss=0.435, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.661, val_accuracy=0.630, val_f1_score=0.630]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 1:  89%|████████▉ | 228/255 [01:29<00:10,  2.54it/s, loss=0.526, v_num=0, train_loss=0.435, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.661, val_accuracy=0.630, val_f1_score=0.630]
Epoch 1:  90%|█████████ | 230/255 [01:29<00:09,  2.56it/s, loss=0.526, v_num=0, train_loss=0.435, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.661, val_accuracy=0.630, val_f1_score=0.630]
Epoch 1:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.526, v_num=0, train_loss=0.435, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.661, val_accuracy=0.630, val_f1_score=0.630]
Epoch 1:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.526, v_num=0, train_loss=0.435, train_accuracy=0.889, 

Epoch 1, global step 451: val_loss reached 0.53729 (best 0.53729), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2-v1.ckpt" as top 2


Epoch 2:  89%|████████▊ | 226/255 [01:24<00:10,  2.69it/s, loss=0.81, v_num=0, train_loss=0.674, train_accuracy=0.611, train_f1_score=0.611, val_loss=0.537, val_accuracy=0.755, val_f1_score=0.755] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 2:  89%|████████▉ | 228/255 [01:29<00:10,  2.54it/s, loss=0.81, v_num=0, train_loss=0.674, train_accuracy=0.611, train_f1_score=0.611, val_loss=0.537, val_accuracy=0.755, val_f1_score=0.755]
Epoch 2:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.81, v_num=0, train_loss=0.674, train_accuracy=0.611, train_f1_score=0.611, val_loss=0.537, val_accuracy=0.755, val_f1_score=0.755]
Epoch 2:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.81, v_num=0, train_loss=0.674, train_accuracy=0.611, train_f1_score=0.611, val_loss=0.537, val_accuracy=0.755, val_f1_score=0.755]
Validating:  21%|██        | 6/29 [00:06<00:12,  1.83it/s][A
Epoch 2:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, lo

Epoch 2, global step 677: val_loss reached 0.65275 (best 0.53729), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2.ckpt" as top 2


Epoch 3:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.608, v_num=0, train_loss=0.604, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.653, val_accuracy=0.610, val_f1_score=0.610]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 3:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.608, v_num=0, train_loss=0.604, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.653, val_accuracy=0.610, val_f1_score=0.610]
Epoch 3:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.608, v_num=0, train_loss=0.604, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.653, val_accuracy=0.610, val_f1_score=0.610]
Epoch 3:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.608, v_num=0, train_loss=0.604, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.653, val_accuracy=0.610, val_f1_score=0.610]
Epoch 3:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.608, v_num=0, train_loss=0.604, train_accuracy=0.667, 

Epoch 3, global step 903: val_loss reached 0.62433 (best 0.53729), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2.ckpt" as top 2


Epoch 4:  89%|████████▊ | 226/255 [01:23<00:10,  2.70it/s, loss=0.446, v_num=0, train_loss=0.327, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.624, val_accuracy=0.667, val_f1_score=0.667]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 4:  89%|████████▉ | 228/255 [01:29<00:10,  2.55it/s, loss=0.446, v_num=0, train_loss=0.327, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.624, val_accuracy=0.667, val_f1_score=0.667]
Epoch 4:  90%|█████████ | 230/255 [01:29<00:09,  2.56it/s, loss=0.446, v_num=0, train_loss=0.327, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.624, val_accuracy=0.667, val_f1_score=0.667]
Epoch 4:  91%|█████████ | 232/255 [01:29<00:08,  2.58it/s, loss=0.446, v_num=0, train_loss=0.327, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.624, val_accuracy=0.667, val_f1_score=0.667]
Epoch 4:  92%|█████████▏| 234/255 [01:30<00:08,  2.60it/s, loss=0.446, v_num=0, train_loss=0.327, train_accuracy=0.889, 

Epoch 4, global step 1129: val_loss reached 0.52442 (best 0.52442), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2.ckpt" as top 2


Epoch 5:  89%|████████▊ | 226/255 [01:24<00:10,  2.69it/s, loss=0.493, v_num=0, train_loss=0.612, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.524, val_accuracy=0.762, val_f1_score=0.762]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 5:  89%|████████▉ | 228/255 [01:29<00:10,  2.54it/s, loss=0.493, v_num=0, train_loss=0.612, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.524, val_accuracy=0.762, val_f1_score=0.762]
Epoch 5:  90%|█████████ | 230/255 [01:29<00:09,  2.56it/s, loss=0.493, v_num=0, train_loss=0.612, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.524, val_accuracy=0.762, val_f1_score=0.762]
Epoch 5:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.493, v_num=0, train_loss=0.612, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.524, val_accuracy=0.762, val_f1_score=0.762]
Epoch 5:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.493, v_num=0, train_loss=0.612, train_accuracy=0.722, 

Epoch 5, global step 1355: val_loss reached 0.51720 (best 0.51720), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2-v1.ckpt" as top 2


Epoch 6:  89%|████████▊ | 226/255 [01:23<00:10,  2.70it/s, loss=0.505, v_num=0, train_loss=0.520, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.517, val_accuracy=0.774, val_f1_score=0.774]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 6:  89%|████████▉ | 228/255 [01:29<00:10,  2.55it/s, loss=0.505, v_num=0, train_loss=0.520, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.517, val_accuracy=0.774, val_f1_score=0.774]
Epoch 6:  90%|█████████ | 230/255 [01:29<00:09,  2.56it/s, loss=0.505, v_num=0, train_loss=0.520, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.517, val_accuracy=0.774, val_f1_score=0.774]
Epoch 6:  91%|█████████ | 232/255 [01:29<00:08,  2.58it/s, loss=0.505, v_num=0, train_loss=0.520, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.517, val_accuracy=0.774, val_f1_score=0.774]
Epoch 6:  92%|█████████▏| 234/255 [01:30<00:08,  2.60it/s, loss=0.505, v_num=0, train_loss=0.520, train_accuracy=0.667, 

Epoch 6, global step 1581: val_loss was not in top 2


Epoch 7:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.432, v_num=0, train_loss=0.338, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.528, val_accuracy=0.739, val_f1_score=0.739]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 7:  89%|████████▉ | 228/255 [01:29<00:10,  2.53it/s, loss=0.432, v_num=0, train_loss=0.338, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.528, val_accuracy=0.739, val_f1_score=0.739]
Epoch 7:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.432, v_num=0, train_loss=0.338, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.528, val_accuracy=0.739, val_f1_score=0.739]
Epoch 7:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.432, v_num=0, train_loss=0.338, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.528, val_accuracy=0.739, val_f1_score=0.739]
Epoch 7:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.432, v_num=0, train_loss=0.338, train_accuracy=0.833, 

Epoch 7, global step 1807: val_loss reached 0.51466 (best 0.51466), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2.ckpt" as top 2


Epoch 8:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.474, v_num=0, train_loss=0.637, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.515, val_accuracy=0.769, val_f1_score=0.769]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 8:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.474, v_num=0, train_loss=0.637, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.515, val_accuracy=0.769, val_f1_score=0.769]
Epoch 8:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.474, v_num=0, train_loss=0.637, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.515, val_accuracy=0.769, val_f1_score=0.769]
Epoch 8:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.474, v_num=0, train_loss=0.637, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.515, val_accuracy=0.769, val_f1_score=0.769]
Epoch 8:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.474, v_num=0, train_loss=0.637, train_accuracy=0.778, 

Epoch 8, global step 2033: val_loss was not in top 2


Epoch 9:  89%|████████▊ | 226/255 [01:23<00:10,  2.70it/s, loss=0.469, v_num=0, train_loss=0.673, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.638, val_accuracy=0.736, val_f1_score=0.736]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 9:  89%|████████▉ | 228/255 [01:29<00:10,  2.55it/s, loss=0.469, v_num=0, train_loss=0.673, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.638, val_accuracy=0.736, val_f1_score=0.736]
Epoch 9:  90%|█████████ | 230/255 [01:29<00:09,  2.56it/s, loss=0.469, v_num=0, train_loss=0.673, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.638, val_accuracy=0.736, val_f1_score=0.736]
Epoch 9:  91%|█████████ | 232/255 [01:29<00:08,  2.58it/s, loss=0.469, v_num=0, train_loss=0.673, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.638, val_accuracy=0.736, val_f1_score=0.736]
Epoch 9:  92%|█████████▏| 234/255 [01:30<00:08,  2.60it/s, loss=0.469, v_num=0, train_loss=0.673, train_accuracy=0.722, 

Epoch 9, global step 2259: val_loss reached 0.47678 (best 0.47678), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2-v1.ckpt" as top 2


Epoch 10:  89%|████████▊ | 226/255 [01:23<00:10,  2.70it/s, loss=0.48, v_num=0, train_loss=0.484, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.477, val_accuracy=0.790, val_f1_score=0.790] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 10:  89%|████████▉ | 228/255 [01:29<00:10,  2.55it/s, loss=0.48, v_num=0, train_loss=0.484, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.477, val_accuracy=0.790, val_f1_score=0.790]
Epoch 10:  90%|█████████ | 230/255 [01:29<00:09,  2.57it/s, loss=0.48, v_num=0, train_loss=0.484, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.477, val_accuracy=0.790, val_f1_score=0.790]
Epoch 10:  91%|█████████ | 232/255 [01:29<00:08,  2.59it/s, loss=0.48, v_num=0, train_loss=0.484, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.477, val_accuracy=0.790, val_f1_score=0.790]
Epoch 10:  92%|█████████▏| 234/255 [01:29<00:08,  2.60it/s, loss=0.48, v_num=0, train_loss=0.484, train_accuracy=0.722,

Epoch 10, global step 2485: val_loss was not in top 2


Epoch 11:  89%|████████▊ | 226/255 [01:24<00:10,  2.69it/s, loss=0.431, v_num=0, train_loss=0.442, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.545, val_accuracy=0.732, val_f1_score=0.732]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 11:  89%|████████▉ | 228/255 [01:29<00:10,  2.54it/s, loss=0.431, v_num=0, train_loss=0.442, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.545, val_accuracy=0.732, val_f1_score=0.732]
Epoch 11:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.431, v_num=0, train_loss=0.442, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.545, val_accuracy=0.732, val_f1_score=0.732]
Epoch 11:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.431, v_num=0, train_loss=0.442, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.545, val_accuracy=0.732, val_f1_score=0.732]
Epoch 11:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.431, v_num=0, train_loss=0.442, train_accuracy=0.

Epoch 11, global step 2711: val_loss reached 0.50602 (best 0.47678), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2.ckpt" as top 2


Epoch 12:  89%|████████▊ | 226/255 [01:24<00:10,  2.69it/s, loss=0.413, v_num=0, train_loss=0.247, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.506, val_accuracy=0.761, val_f1_score=0.761]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 12:  89%|████████▉ | 228/255 [01:29<00:10,  2.54it/s, loss=0.413, v_num=0, train_loss=0.247, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.506, val_accuracy=0.761, val_f1_score=0.761]
Epoch 12:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.413, v_num=0, train_loss=0.247, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.506, val_accuracy=0.761, val_f1_score=0.761]
Epoch 12:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.413, v_num=0, train_loss=0.247, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.506, val_accuracy=0.761, val_f1_score=0.761]
Epoch 12:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.413, v_num=0, train_loss=0.247, train_accuracy=0.

Epoch 12, global step 2937: val_loss was not in top 2


Epoch 13:  89%|████████▊ | 226/255 [01:23<00:10,  2.69it/s, loss=0.425, v_num=0, train_loss=0.676, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.551, val_accuracy=0.742, val_f1_score=0.742]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 13:  89%|████████▉ | 228/255 [01:29<00:10,  2.54it/s, loss=0.425, v_num=0, train_loss=0.676, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.551, val_accuracy=0.742, val_f1_score=0.742]
Epoch 13:  90%|█████████ | 230/255 [01:29<00:09,  2.56it/s, loss=0.425, v_num=0, train_loss=0.676, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.551, val_accuracy=0.742, val_f1_score=0.742]
Epoch 13:  91%|█████████ | 232/255 [01:30<00:08,  2.58it/s, loss=0.425, v_num=0, train_loss=0.676, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.551, val_accuracy=0.742, val_f1_score=0.742]
Epoch 13:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.425, v_num=0, train_loss=0.676, train_accuracy=0.

Epoch 13, global step 3163: val_loss was not in top 2


Epoch 14:  89%|████████▊ | 226/255 [01:23<00:10,  2.70it/s, loss=0.397, v_num=0, train_loss=0.355, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.641, val_accuracy=0.697, val_f1_score=0.697]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 14:  89%|████████▉ | 228/255 [01:29<00:10,  2.54it/s, loss=0.397, v_num=0, train_loss=0.355, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.641, val_accuracy=0.697, val_f1_score=0.697]
Epoch 14:  90%|█████████ | 230/255 [01:29<00:09,  2.56it/s, loss=0.397, v_num=0, train_loss=0.355, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.641, val_accuracy=0.697, val_f1_score=0.697]
Epoch 14:  91%|█████████ | 232/255 [01:30<00:08,  2.58it/s, loss=0.397, v_num=0, train_loss=0.355, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.641, val_accuracy=0.697, val_f1_score=0.697]
Epoch 14:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.397, v_num=0, train_loss=0.355, train_accuracy=0.

Epoch 14, global step 3389: val_loss was not in top 2


Epoch 15:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.355, v_num=0, train_loss=0.438, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.689, val_accuracy=0.722, val_f1_score=0.722]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 15:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.355, v_num=0, train_loss=0.438, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.689, val_accuracy=0.722, val_f1_score=0.722]
Epoch 15:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.355, v_num=0, train_loss=0.438, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.689, val_accuracy=0.722, val_f1_score=0.722]
Epoch 15:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.355, v_num=0, train_loss=0.438, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.689, val_accuracy=0.722, val_f1_score=0.722]
Epoch 15:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.355, v_num=0, train_loss=0.438, train_accuracy=0.

Epoch 15, global step 3615: val_loss was not in top 2


Epoch 16:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.373, v_num=0, train_loss=0.579, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.831, val_accuracy=0.713, val_f1_score=0.713]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 16:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.373, v_num=0, train_loss=0.579, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.831, val_accuracy=0.713, val_f1_score=0.713]
Epoch 16:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.373, v_num=0, train_loss=0.579, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.831, val_accuracy=0.713, val_f1_score=0.713]
Epoch 16:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.373, v_num=0, train_loss=0.579, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.831, val_accuracy=0.713, val_f1_score=0.713]
Epoch 16:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.373, v_num=0, train_loss=0.579, train_accuracy=0.

Epoch 16, global step 3841: val_loss was not in top 2


Epoch 17:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.39, v_num=0, train_loss=0.317, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.756, val_accuracy=0.742, val_f1_score=0.742] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 17:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.39, v_num=0, train_loss=0.317, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.756, val_accuracy=0.742, val_f1_score=0.742]
Validating:   7%|▋         | 2/29 [00:05<01:05,  2.44s/it][A
Epoch 17:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.39, v_num=0, train_loss=0.317, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.756, val_accuracy=0.742, val_f1_score=0.742]
Epoch 17:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.39, v_num=0, train_loss=0.317, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.756, val_accuracy=0.742, val_f1_score=0.742]
Epoch 17:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/

Epoch 17, global step 4067: val_loss reached 0.45839 (best 0.45839), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2.ckpt" as top 2


Epoch 18:  89%|████████▊ | 226/255 [01:24<00:10,  2.69it/s, loss=0.315, v_num=0, train_loss=0.249, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.458, val_accuracy=0.779, val_f1_score=0.779]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 18:  89%|████████▉ | 228/255 [01:29<00:10,  2.53it/s, loss=0.315, v_num=0, train_loss=0.249, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.458, val_accuracy=0.779, val_f1_score=0.779]
Epoch 18:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.315, v_num=0, train_loss=0.249, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.458, val_accuracy=0.779, val_f1_score=0.779]
Epoch 18:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.315, v_num=0, train_loss=0.249, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.458, val_accuracy=0.779, val_f1_score=0.779]
Epoch 18:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.315, v_num=0, train_loss=0.249, train_accuracy=0.

Epoch 18, global step 4293: val_loss was not in top 2


Epoch 19:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.327, v_num=0, train_loss=0.242, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.552, val_accuracy=0.771, val_f1_score=0.771]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 19:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.327, v_num=0, train_loss=0.242, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.552, val_accuracy=0.771, val_f1_score=0.771]
Epoch 19:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.327, v_num=0, train_loss=0.242, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.552, val_accuracy=0.771, val_f1_score=0.771]
Epoch 19:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.327, v_num=0, train_loss=0.242, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.552, val_accuracy=0.771, val_f1_score=0.771]
Epoch 19:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.327, v_num=0, train_loss=0.242, train_accuracy=0.

Epoch 19, global step 4519: val_loss was not in top 2


Epoch 20:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.289, v_num=0, train_loss=0.113, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.583, val_accuracy=0.755, val_f1_score=0.755]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 20:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.289, v_num=0, train_loss=0.113, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.583, val_accuracy=0.755, val_f1_score=0.755]
Epoch 20:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.289, v_num=0, train_loss=0.113, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.583, val_accuracy=0.755, val_f1_score=0.755]
Epoch 20:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.289, v_num=0, train_loss=0.113, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.583, val_accuracy=0.755, val_f1_score=0.755]
Epoch 20:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.289, v_num=0, train_loss=0.113, train_accuracy=1.

Epoch 20, global step 4745: val_loss was not in top 2


Epoch 21:  89%|████████▊ | 226/255 [01:24<00:10,  2.67it/s, loss=0.369, v_num=0, train_loss=0.409, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.861, val_accuracy=0.736, val_f1_score=0.736]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 21:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.369, v_num=0, train_loss=0.409, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.861, val_accuracy=0.736, val_f1_score=0.736]
Epoch 21:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.369, v_num=0, train_loss=0.409, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.861, val_accuracy=0.736, val_f1_score=0.736]
Epoch 21:  91%|█████████ | 232/255 [01:30<00:09,  2.55it/s, loss=0.369, v_num=0, train_loss=0.409, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.861, val_accuracy=0.736, val_f1_score=0.736]
Epoch 21:  92%|█████████▏| 234/255 [01:30<00:08,  2.57it/s, loss=0.369, v_num=0, train_loss=0.409, train_accuracy=0.

Epoch 21, global step 4971: val_loss was not in top 2


Epoch 22:  89%|████████▊ | 226/255 [01:24<00:10,  2.67it/s, loss=0.313, v_num=0, train_loss=0.251, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.497, val_accuracy=0.776, val_f1_score=0.776]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 22:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.313, v_num=0, train_loss=0.251, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.497, val_accuracy=0.776, val_f1_score=0.776]
Epoch 22:  90%|█████████ | 230/255 [01:30<00:09,  2.53it/s, loss=0.313, v_num=0, train_loss=0.251, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.497, val_accuracy=0.776, val_f1_score=0.776]
Epoch 22:  91%|█████████ | 232/255 [01:30<00:09,  2.55it/s, loss=0.313, v_num=0, train_loss=0.251, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.497, val_accuracy=0.776, val_f1_score=0.776]
Epoch 22:  92%|█████████▏| 234/255 [01:31<00:08,  2.57it/s, loss=0.313, v_num=0, train_loss=0.251, train_accuracy=0.

Epoch 22, global step 5197: val_loss reached 0.44958 (best 0.44958), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2-v1.ckpt" as top 2


Epoch 23:  89%|████████▊ | 226/255 [01:24<00:10,  2.66it/s, loss=0.296, v_num=0, train_loss=0.0136, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.450, val_accuracy=0.795, val_f1_score=0.795]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 23:  89%|████████▉ | 228/255 [01:30<00:10,  2.51it/s, loss=0.296, v_num=0, train_loss=0.0136, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.450, val_accuracy=0.795, val_f1_score=0.795]
Epoch 23:  90%|█████████ | 230/255 [01:30<00:09,  2.53it/s, loss=0.296, v_num=0, train_loss=0.0136, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.450, val_accuracy=0.795, val_f1_score=0.795]
Epoch 23:  91%|█████████ | 232/255 [01:31<00:09,  2.55it/s, loss=0.296, v_num=0, train_loss=0.0136, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.450, val_accuracy=0.795, val_f1_score=0.795]
Epoch 23:  92%|█████████▏| 234/255 [01:31<00:08,  2.57it/s, loss=0.296, v_num=0, train_loss=0.0136, train_accura

Epoch 23, global step 5423: val_loss was not in top 2


Epoch 24:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.282, v_num=0, train_loss=0.307, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.554, val_accuracy=0.797, val_f1_score=0.797] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 24:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.282, v_num=0, train_loss=0.307, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.554, val_accuracy=0.797, val_f1_score=0.797]
Epoch 24:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.282, v_num=0, train_loss=0.307, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.554, val_accuracy=0.797, val_f1_score=0.797]
Epoch 24:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.282, v_num=0, train_loss=0.307, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.554, val_accuracy=0.797, val_f1_score=0.797]
Epoch 24:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.282, v_num=0, train_loss=0.307, train_accuracy=0

Epoch 24, global step 5649: val_loss was not in top 2


Epoch 25:  89%|████████▊ | 226/255 [01:24<00:10,  2.67it/s, loss=0.334, v_num=0, train_loss=0.120, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.526, val_accuracy=0.799, val_f1_score=0.799]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 25:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.334, v_num=0, train_loss=0.120, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.526, val_accuracy=0.799, val_f1_score=0.799]
Epoch 25:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.334, v_num=0, train_loss=0.120, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.526, val_accuracy=0.799, val_f1_score=0.799]
Epoch 25:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.334, v_num=0, train_loss=0.120, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.526, val_accuracy=0.799, val_f1_score=0.799]
Epoch 25:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.334, v_num=0, train_loss=0.120, train_accuracy=1.

Epoch 25, global step 5875: val_loss was not in top 2


Epoch 26:  89%|████████▊ | 226/255 [01:24<00:10,  2.69it/s, loss=0.313, v_num=0, train_loss=0.567, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.522, val_accuracy=0.796, val_f1_score=0.796]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 26:  89%|████████▉ | 228/255 [01:29<00:10,  2.54it/s, loss=0.313, v_num=0, train_loss=0.567, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.522, val_accuracy=0.796, val_f1_score=0.796]
Epoch 26:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.313, v_num=0, train_loss=0.567, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.522, val_accuracy=0.796, val_f1_score=0.796]
Epoch 26:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.313, v_num=0, train_loss=0.567, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.522, val_accuracy=0.796, val_f1_score=0.796]
Epoch 26:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.313, v_num=0, train_loss=0.567, train_accuracy=0.

Epoch 26, global step 6101: val_loss reached 0.42467 (best 0.42467), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2.ckpt" as top 2


Epoch 27:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.269, v_num=0, train_loss=0.448, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.425, val_accuracy=0.811, val_f1_score=0.811]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 27:  89%|████████▉ | 228/255 [01:29<00:10,  2.53it/s, loss=0.269, v_num=0, train_loss=0.448, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.425, val_accuracy=0.811, val_f1_score=0.811]
Epoch 27:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.269, v_num=0, train_loss=0.448, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.425, val_accuracy=0.811, val_f1_score=0.811]
Epoch 27:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.269, v_num=0, train_loss=0.448, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.425, val_accuracy=0.811, val_f1_score=0.811]
Epoch 27:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.269, v_num=0, train_loss=0.448, train_accuracy=0.

Epoch 27, global step 6327: val_loss was not in top 2


Epoch 28:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.242, v_num=0, train_loss=0.121, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.512, val_accuracy=0.813, val_f1_score=0.813]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 28:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.242, v_num=0, train_loss=0.121, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.512, val_accuracy=0.813, val_f1_score=0.813]
Epoch 28:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.242, v_num=0, train_loss=0.121, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.512, val_accuracy=0.813, val_f1_score=0.813]
Epoch 28:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.242, v_num=0, train_loss=0.121, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.512, val_accuracy=0.813, val_f1_score=0.813]
Epoch 28:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.242, v_num=0, train_loss=0.121, train_accuracy=0.

Epoch 28, global step 6553: val_loss was not in top 2


Epoch 29:  89%|████████▊ | 226/255 [01:24<00:10,  2.69it/s, loss=0.326, v_num=0, train_loss=0.426, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.505, val_accuracy=0.843, val_f1_score=0.843]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 29:  89%|████████▉ | 228/255 [01:29<00:10,  2.53it/s, loss=0.326, v_num=0, train_loss=0.426, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.505, val_accuracy=0.843, val_f1_score=0.843]
Epoch 29:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.326, v_num=0, train_loss=0.426, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.505, val_accuracy=0.843, val_f1_score=0.843]
Epoch 29:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.326, v_num=0, train_loss=0.426, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.505, val_accuracy=0.843, val_f1_score=0.843]
Epoch 29:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.326, v_num=0, train_loss=0.426, train_accuracy=0.

Epoch 29, global step 6779: val_loss was not in top 2


Epoch 30:  89%|████████▊ | 226/255 [01:23<00:10,  2.70it/s, loss=0.362, v_num=0, train_loss=0.214, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.604, val_accuracy=0.823, val_f1_score=0.823]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 30:  89%|████████▉ | 228/255 [01:29<00:10,  2.55it/s, loss=0.362, v_num=0, train_loss=0.214, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.604, val_accuracy=0.823, val_f1_score=0.823]
Epoch 30:  90%|█████████ | 230/255 [01:29<00:09,  2.57it/s, loss=0.362, v_num=0, train_loss=0.214, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.604, val_accuracy=0.823, val_f1_score=0.823]
Epoch 30:  91%|█████████ | 232/255 [01:29<00:08,  2.58it/s, loss=0.362, v_num=0, train_loss=0.214, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.604, val_accuracy=0.823, val_f1_score=0.823]
Epoch 30:  92%|█████████▏| 234/255 [01:29<00:08,  2.60it/s, loss=0.362, v_num=0, train_loss=0.214, train_accuracy=0.

Epoch 30, global step 7005: val_loss was not in top 2


Epoch 31:  89%|████████▊ | 226/255 [01:23<00:10,  2.70it/s, loss=0.289, v_num=0, train_loss=0.432, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.604, val_accuracy=0.798, val_f1_score=0.798] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 31:  89%|████████▉ | 228/255 [01:29<00:10,  2.55it/s, loss=0.289, v_num=0, train_loss=0.432, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.604, val_accuracy=0.798, val_f1_score=0.798]
Epoch 31:  90%|█████████ | 230/255 [01:29<00:09,  2.57it/s, loss=0.289, v_num=0, train_loss=0.432, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.604, val_accuracy=0.798, val_f1_score=0.798]
Epoch 31:  91%|█████████ | 232/255 [01:29<00:08,  2.59it/s, loss=0.289, v_num=0, train_loss=0.432, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.604, val_accuracy=0.798, val_f1_score=0.798]
Epoch 31:  92%|█████████▏| 234/255 [01:29<00:08,  2.60it/s, loss=0.289, v_num=0, train_loss=0.432, train_accuracy=0

Epoch 31, global step 7231: val_loss reached 0.41158 (best 0.41158), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2-v1.ckpt" as top 2


Epoch 32:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.273, v_num=0, train_loss=0.268, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.412, val_accuracy=0.840, val_f1_score=0.840]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 32:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.273, v_num=0, train_loss=0.268, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.412, val_accuracy=0.840, val_f1_score=0.840]
Epoch 32:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.273, v_num=0, train_loss=0.268, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.412, val_accuracy=0.840, val_f1_score=0.840]
Epoch 32:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.273, v_num=0, train_loss=0.268, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.412, val_accuracy=0.840, val_f1_score=0.840]
Epoch 32:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.273, v_num=0, train_loss=0.268, train_accuracy=0.

Epoch 32, global step 7457: val_loss reached 0.40237 (best 0.40237), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2.ckpt" as top 2


Epoch 33:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.622, v_num=0, train_loss=0.622, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.402, val_accuracy=0.854, val_f1_score=0.854]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 33:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.622, v_num=0, train_loss=0.622, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.402, val_accuracy=0.854, val_f1_score=0.854]
Epoch 33:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.622, v_num=0, train_loss=0.622, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.402, val_accuracy=0.854, val_f1_score=0.854]
Epoch 33:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.622, v_num=0, train_loss=0.622, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.402, val_accuracy=0.854, val_f1_score=0.854]
Epoch 33:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.622, v_num=0, train_loss=0.622, train_accuracy=0.

Epoch 33, global step 7683: val_loss was not in top 2


Epoch 34:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.445, v_num=0, train_loss=0.504, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.591, val_accuracy=0.688, val_f1_score=0.688]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 34:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.445, v_num=0, train_loss=0.504, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.591, val_accuracy=0.688, val_f1_score=0.688]
Epoch 34:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.445, v_num=0, train_loss=0.504, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.591, val_accuracy=0.688, val_f1_score=0.688]
Epoch 34:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.445, v_num=0, train_loss=0.504, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.591, val_accuracy=0.688, val_f1_score=0.688]
Epoch 34:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.445, v_num=0, train_loss=0.504, train_accuracy=0.

Epoch 34, global step 7909: val_loss was not in top 2


Epoch 35:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.377, v_num=0, train_loss=0.288, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.540, val_accuracy=0.743, val_f1_score=0.743]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 35:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.377, v_num=0, train_loss=0.288, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.540, val_accuracy=0.743, val_f1_score=0.743]
Epoch 35:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.377, v_num=0, train_loss=0.288, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.540, val_accuracy=0.743, val_f1_score=0.743]
Epoch 35:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.377, v_num=0, train_loss=0.288, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.540, val_accuracy=0.743, val_f1_score=0.743]
Epoch 35:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.377, v_num=0, train_loss=0.288, train_accuracy=0.

Epoch 35, global step 8135: val_loss was not in top 2


Epoch 36:  89%|████████▊ | 226/255 [01:24<00:10,  2.69it/s, loss=0.281, v_num=0, train_loss=0.169, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.457, val_accuracy=0.771, val_f1_score=0.771]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 36:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.281, v_num=0, train_loss=0.169, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.457, val_accuracy=0.771, val_f1_score=0.771]
Epoch 36:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.281, v_num=0, train_loss=0.169, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.457, val_accuracy=0.771, val_f1_score=0.771]
Epoch 36:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.281, v_num=0, train_loss=0.169, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.457, val_accuracy=0.771, val_f1_score=0.771]
Epoch 36:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.281, v_num=0, train_loss=0.169, train_accuracy=0.

Epoch 36, global step 8361: val_loss was not in top 2


Epoch 37:  89%|████████▊ | 226/255 [01:24<00:10,  2.67it/s, loss=0.326, v_num=0, train_loss=0.505, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.412, val_accuracy=0.812, val_f1_score=0.812] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 37:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.326, v_num=0, train_loss=0.505, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.412, val_accuracy=0.812, val_f1_score=0.812]
Epoch 37:  90%|█████████ | 230/255 [01:30<00:09,  2.53it/s, loss=0.326, v_num=0, train_loss=0.505, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.412, val_accuracy=0.812, val_f1_score=0.812]
Epoch 37:  91%|█████████ | 232/255 [01:30<00:09,  2.55it/s, loss=0.326, v_num=0, train_loss=0.505, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.412, val_accuracy=0.812, val_f1_score=0.812]
Epoch 37:  92%|█████████▏| 234/255 [01:31<00:08,  2.57it/s, loss=0.326, v_num=0, train_loss=0.505, train_accuracy=0

Epoch 37, global step 8587: val_loss was not in top 2


Epoch 38:  89%|████████▊ | 226/255 [01:24<00:10,  2.69it/s, loss=0.207, v_num=0, train_loss=0.150, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.489, val_accuracy=0.834, val_f1_score=0.834]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 38:  89%|████████▉ | 228/255 [01:29<00:10,  2.54it/s, loss=0.207, v_num=0, train_loss=0.150, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.489, val_accuracy=0.834, val_f1_score=0.834]
Epoch 38:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.207, v_num=0, train_loss=0.150, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.489, val_accuracy=0.834, val_f1_score=0.834]
Epoch 38:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.207, v_num=0, train_loss=0.150, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.489, val_accuracy=0.834, val_f1_score=0.834]
Epoch 38:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.207, v_num=0, train_loss=0.150, train_accuracy=1.

Epoch 38, global step 8813: val_loss was not in top 2


Epoch 39:  89%|████████▊ | 226/255 [01:23<00:10,  2.70it/s, loss=0.254, v_num=0, train_loss=0.280, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.497, val_accuracy=0.823, val_f1_score=0.823] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 39:  89%|████████▉ | 228/255 [01:29<00:10,  2.54it/s, loss=0.254, v_num=0, train_loss=0.280, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.497, val_accuracy=0.823, val_f1_score=0.823]
Epoch 39:  90%|█████████ | 230/255 [01:29<00:09,  2.56it/s, loss=0.254, v_num=0, train_loss=0.280, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.497, val_accuracy=0.823, val_f1_score=0.823]
Epoch 39:  91%|█████████ | 232/255 [01:29<00:08,  2.58it/s, loss=0.254, v_num=0, train_loss=0.280, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.497, val_accuracy=0.823, val_f1_score=0.823]
Epoch 39:  92%|█████████▏| 234/255 [01:30<00:08,  2.60it/s, loss=0.254, v_num=0, train_loss=0.280, train_accuracy=0

Epoch 39, global step 9039: val_loss was not in top 2


Epoch 40:  89%|████████▊ | 226/255 [01:23<00:10,  2.70it/s, loss=0.265, v_num=0, train_loss=0.225, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.468, val_accuracy=0.795, val_f1_score=0.795] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 40:  89%|████████▉ | 228/255 [01:29<00:10,  2.54it/s, loss=0.265, v_num=0, train_loss=0.225, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.468, val_accuracy=0.795, val_f1_score=0.795]
Epoch 40:  90%|█████████ | 230/255 [01:29<00:09,  2.56it/s, loss=0.265, v_num=0, train_loss=0.225, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.468, val_accuracy=0.795, val_f1_score=0.795]
Epoch 40:  91%|█████████ | 232/255 [01:30<00:08,  2.58it/s, loss=0.265, v_num=0, train_loss=0.225, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.468, val_accuracy=0.795, val_f1_score=0.795]
Epoch 40:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.265, v_num=0, train_loss=0.225, train_accuracy=0

Epoch 40, global step 9265: val_loss was not in top 2


Epoch 41:  89%|████████▊ | 226/255 [01:23<00:10,  2.69it/s, loss=0.226, v_num=0, train_loss=0.310, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.440, val_accuracy=0.817, val_f1_score=0.817] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 41:  89%|████████▉ | 228/255 [01:29<00:10,  2.54it/s, loss=0.226, v_num=0, train_loss=0.310, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.440, val_accuracy=0.817, val_f1_score=0.817]
Epoch 41:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.226, v_num=0, train_loss=0.310, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.440, val_accuracy=0.817, val_f1_score=0.817]
Epoch 41:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.226, v_num=0, train_loss=0.310, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.440, val_accuracy=0.817, val_f1_score=0.817]
Epoch 41:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.226, v_num=0, train_loss=0.310, train_accuracy=0

Epoch 41, global step 9491: val_loss was not in top 2


Epoch 42:  89%|████████▊ | 226/255 [01:24<00:10,  2.69it/s, loss=0.221, v_num=0, train_loss=0.224, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.498, val_accuracy=0.823, val_f1_score=0.823] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 42:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.221, v_num=0, train_loss=0.224, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.498, val_accuracy=0.823, val_f1_score=0.823]
Epoch 42:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.221, v_num=0, train_loss=0.224, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.498, val_accuracy=0.823, val_f1_score=0.823]
Epoch 42:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.221, v_num=0, train_loss=0.224, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.498, val_accuracy=0.823, val_f1_score=0.823]
Epoch 42:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.221, v_num=0, train_loss=0.224, train_accuracy=0

Epoch 42, global step 9717: val_loss reached 0.39008 (best 0.39008), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2-v1.ckpt" as top 2


Epoch 43:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.413, v_num=0, train_loss=0.191, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.390, val_accuracy=0.856, val_f1_score=0.856] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 43:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.413, v_num=0, train_loss=0.191, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.390, val_accuracy=0.856, val_f1_score=0.856]
Epoch 43:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.413, v_num=0, train_loss=0.191, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.390, val_accuracy=0.856, val_f1_score=0.856]
Epoch 43:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.413, v_num=0, train_loss=0.191, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.390, val_accuracy=0.856, val_f1_score=0.856]
Epoch 43:  92%|█████████▏| 234/255 [01:30<00:08,  2.57it/s, loss=0.413, v_num=0, train_loss=0.191, train_accuracy=0

Epoch 43, global step 9943: val_loss was not in top 2


Epoch 44:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.304, v_num=0, train_loss=0.208, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.413, val_accuracy=0.825, val_f1_score=0.825]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 44:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.304, v_num=0, train_loss=0.208, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.413, val_accuracy=0.825, val_f1_score=0.825]
Epoch 44:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.304, v_num=0, train_loss=0.208, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.413, val_accuracy=0.825, val_f1_score=0.825]
Epoch 44:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.304, v_num=0, train_loss=0.208, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.413, val_accuracy=0.825, val_f1_score=0.825]
Epoch 44:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.304, v_num=0, train_loss=0.208, train_accuracy=0.

Epoch 44, global step 10169: val_loss was not in top 2


Epoch 45:  89%|████████▊ | 226/255 [01:23<00:10,  2.69it/s, loss=0.23, v_num=0, train_loss=0.567, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.570, val_accuracy=0.784, val_f1_score=0.784]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 45:  89%|████████▉ | 228/255 [01:29<00:10,  2.53it/s, loss=0.23, v_num=0, train_loss=0.567, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.570, val_accuracy=0.784, val_f1_score=0.784]
Epoch 45:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.23, v_num=0, train_loss=0.567, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.570, val_accuracy=0.784, val_f1_score=0.784]
Epoch 45:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.23, v_num=0, train_loss=0.567, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.570, val_accuracy=0.784, val_f1_score=0.784]
Epoch 45:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.23, v_num=0, train_loss=0.567, train_accuracy=0.778

Epoch 45, global step 10395: val_loss reached 0.32372 (best 0.32372), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2.ckpt" as top 2


Epoch 46:  89%|████████▊ | 226/255 [01:23<00:10,  2.69it/s, loss=0.268, v_num=0, train_loss=0.249, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.324, val_accuracy=0.875, val_f1_score=0.875] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 46:  89%|████████▉ | 228/255 [01:29<00:10,  2.54it/s, loss=0.268, v_num=0, train_loss=0.249, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.324, val_accuracy=0.875, val_f1_score=0.875]
Epoch 46:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.268, v_num=0, train_loss=0.249, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.324, val_accuracy=0.875, val_f1_score=0.875]
Epoch 46:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.268, v_num=0, train_loss=0.249, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.324, val_accuracy=0.875, val_f1_score=0.875]
Epoch 46:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.268, v_num=0, train_loss=0.249, train_accuracy=0

Epoch 46, global step 10621: val_loss reached 0.35150 (best 0.32372), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2-v1.ckpt" as top 2


Epoch 47:  89%|████████▊ | 226/255 [01:24<00:10,  2.66it/s, loss=0.258, v_num=0, train_loss=0.052, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.352, val_accuracy=0.856, val_f1_score=0.856] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 47:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.258, v_num=0, train_loss=0.052, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.352, val_accuracy=0.856, val_f1_score=0.856]
Epoch 47:  90%|█████████ | 230/255 [01:30<00:09,  2.53it/s, loss=0.258, v_num=0, train_loss=0.052, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.352, val_accuracy=0.856, val_f1_score=0.856]
Epoch 47:  91%|█████████ | 232/255 [01:30<00:09,  2.55it/s, loss=0.258, v_num=0, train_loss=0.052, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.352, val_accuracy=0.856, val_f1_score=0.856]
Epoch 47:  92%|█████████▏| 234/255 [01:31<00:08,  2.57it/s, loss=0.258, v_num=0, train_loss=0.052, train_accuracy=1

Epoch 47, global step 10847: val_loss was not in top 2


Epoch 48:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.293, v_num=0, train_loss=0.493, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.357, val_accuracy=0.856, val_f1_score=0.856]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 48:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.293, v_num=0, train_loss=0.493, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.357, val_accuracy=0.856, val_f1_score=0.856]
Epoch 48:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.293, v_num=0, train_loss=0.493, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.357, val_accuracy=0.856, val_f1_score=0.856]
Epoch 48:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.293, v_num=0, train_loss=0.493, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.357, val_accuracy=0.856, val_f1_score=0.856]
Epoch 48:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.293, v_num=0, train_loss=0.493, train_accuracy=0.

Epoch 48, global step 11073: val_loss was not in top 2


Epoch 49:  89%|████████▊ | 226/255 [01:25<00:10,  2.66it/s, loss=0.25, v_num=0, train_loss=0.317, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.358, val_accuracy=0.846, val_f1_score=0.846]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 49:  89%|████████▉ | 228/255 [01:30<00:10,  2.51it/s, loss=0.25, v_num=0, train_loss=0.317, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.358, val_accuracy=0.846, val_f1_score=0.846]
Epoch 49:  90%|█████████ | 230/255 [01:31<00:09,  2.53it/s, loss=0.25, v_num=0, train_loss=0.317, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.358, val_accuracy=0.846, val_f1_score=0.846]
Epoch 49:  91%|█████████ | 232/255 [01:31<00:09,  2.54it/s, loss=0.25, v_num=0, train_loss=0.317, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.358, val_accuracy=0.846, val_f1_score=0.846]
Epoch 49:  92%|█████████▏| 234/255 [01:31<00:08,  2.56it/s, loss=0.25, v_num=0, train_loss=0.317, train_accuracy=0.944

Epoch 49, global step 11299: val_loss was not in top 2


Epoch 50:  89%|████████▊ | 226/255 [01:24<00:10,  2.67it/s, loss=0.206, v_num=0, train_loss=0.197, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.357, val_accuracy=0.853, val_f1_score=0.853] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 50:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.206, v_num=0, train_loss=0.197, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.357, val_accuracy=0.853, val_f1_score=0.853]
Epoch 50:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.206, v_num=0, train_loss=0.197, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.357, val_accuracy=0.853, val_f1_score=0.853]
Epoch 50:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.206, v_num=0, train_loss=0.197, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.357, val_accuracy=0.853, val_f1_score=0.853]
Epoch 50:  92%|█████████▏| 234/255 [01:30<00:08,  2.57it/s, loss=0.206, v_num=0, train_loss=0.197, train_accuracy=0

Epoch 50, global step 11525: val_loss was not in top 2


Epoch 51:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.31, v_num=0, train_loss=0.262, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.379, val_accuracy=0.855, val_f1_score=0.855]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 51:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.31, v_num=0, train_loss=0.262, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.379, val_accuracy=0.855, val_f1_score=0.855]
Epoch 51:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.31, v_num=0, train_loss=0.262, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.379, val_accuracy=0.855, val_f1_score=0.855]
Epoch 51:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.31, v_num=0, train_loss=0.262, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.379, val_accuracy=0.855, val_f1_score=0.855]
Epoch 51:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.31, v_num=0, train_loss=0.262, train_accuracy=0.889

Epoch 51, global step 11751: val_loss was not in top 2


Epoch 52:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.227, v_num=0, train_loss=0.235, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.504, val_accuracy=0.839, val_f1_score=0.839] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 52:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.227, v_num=0, train_loss=0.235, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.504, val_accuracy=0.839, val_f1_score=0.839]
Epoch 52:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.227, v_num=0, train_loss=0.235, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.504, val_accuracy=0.839, val_f1_score=0.839]
Epoch 52:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.227, v_num=0, train_loss=0.235, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.504, val_accuracy=0.839, val_f1_score=0.839]
Epoch 52:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.227, v_num=0, train_loss=0.235, train_accuracy=0

Epoch 52, global step 11977: val_loss was not in top 2


Epoch 53:  89%|████████▊ | 226/255 [01:23<00:10,  2.70it/s, loss=0.188, v_num=0, train_loss=0.159, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.388, val_accuracy=0.823, val_f1_score=0.823] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 53:  89%|████████▉ | 228/255 [01:29<00:10,  2.54it/s, loss=0.188, v_num=0, train_loss=0.159, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.388, val_accuracy=0.823, val_f1_score=0.823]
Epoch 53:  90%|█████████ | 230/255 [01:29<00:09,  2.56it/s, loss=0.188, v_num=0, train_loss=0.159, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.388, val_accuracy=0.823, val_f1_score=0.823]
Epoch 53:  91%|█████████ | 232/255 [01:29<00:08,  2.58it/s, loss=0.188, v_num=0, train_loss=0.159, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.388, val_accuracy=0.823, val_f1_score=0.823]
Epoch 53:  92%|█████████▏| 234/255 [01:30<00:08,  2.60it/s, loss=0.188, v_num=0, train_loss=0.159, train_accuracy=0

Epoch 53, global step 12203: val_loss was not in top 2


Epoch 54:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.217, v_num=0, train_loss=0.195, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.578, val_accuracy=0.820, val_f1_score=0.820] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 54:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.217, v_num=0, train_loss=0.195, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.578, val_accuracy=0.820, val_f1_score=0.820]
Epoch 54:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.217, v_num=0, train_loss=0.195, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.578, val_accuracy=0.820, val_f1_score=0.820]
Epoch 54:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.217, v_num=0, train_loss=0.195, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.578, val_accuracy=0.820, val_f1_score=0.820]
Epoch 54:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.217, v_num=0, train_loss=0.195, train_accuracy=0

Epoch 54, global step 12429: val_loss was not in top 2


Epoch 55:  89%|████████▊ | 226/255 [01:23<00:10,  2.69it/s, loss=0.217, v_num=0, train_loss=0.0762, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.394, val_accuracy=0.851, val_f1_score=0.851]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 55:  89%|████████▉ | 228/255 [01:29<00:10,  2.54it/s, loss=0.217, v_num=0, train_loss=0.0762, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.394, val_accuracy=0.851, val_f1_score=0.851]
Epoch 55:  90%|█████████ | 230/255 [01:29<00:09,  2.56it/s, loss=0.217, v_num=0, train_loss=0.0762, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.394, val_accuracy=0.851, val_f1_score=0.851]
Epoch 55:  91%|█████████ | 232/255 [01:30<00:08,  2.58it/s, loss=0.217, v_num=0, train_loss=0.0762, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.394, val_accuracy=0.851, val_f1_score=0.851]
Epoch 55:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.217, v_num=0, train_loss=0.0762, train_accura

Epoch 55, global step 12655: val_loss reached 0.34934 (best 0.32372), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2-v1.ckpt" as top 2


Epoch 56:  89%|████████▊ | 226/255 [01:23<00:10,  2.69it/s, loss=0.199, v_num=0, train_loss=0.241, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.349, val_accuracy=0.867, val_f1_score=0.867] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 56:  89%|████████▉ | 228/255 [01:29<00:10,  2.54it/s, loss=0.199, v_num=0, train_loss=0.241, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.349, val_accuracy=0.867, val_f1_score=0.867]
Epoch 56:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.199, v_num=0, train_loss=0.241, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.349, val_accuracy=0.867, val_f1_score=0.867]
Epoch 56:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.199, v_num=0, train_loss=0.241, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.349, val_accuracy=0.867, val_f1_score=0.867]
Epoch 56:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.199, v_num=0, train_loss=0.241, train_accuracy=0

Epoch 56, global step 12881: val_loss was not in top 2


Epoch 57:  89%|████████▊ | 226/255 [01:24<00:10,  2.67it/s, loss=0.184, v_num=0, train_loss=0.333, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.433, val_accuracy=0.858, val_f1_score=0.858] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 57:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.184, v_num=0, train_loss=0.333, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.433, val_accuracy=0.858, val_f1_score=0.858]
Epoch 57:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.184, v_num=0, train_loss=0.333, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.433, val_accuracy=0.858, val_f1_score=0.858]
Epoch 57:  91%|█████████ | 232/255 [01:30<00:09,  2.55it/s, loss=0.184, v_num=0, train_loss=0.333, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.433, val_accuracy=0.858, val_f1_score=0.858]
Epoch 57:  92%|█████████▏| 234/255 [01:30<00:08,  2.57it/s, loss=0.184, v_num=0, train_loss=0.333, train_accuracy=0

Epoch 57, global step 13107: val_loss was not in top 2


Epoch 58:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.155, v_num=0, train_loss=0.131, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.359, val_accuracy=0.878, val_f1_score=0.878] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 58:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.155, v_num=0, train_loss=0.131, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.359, val_accuracy=0.878, val_f1_score=0.878]
Epoch 58:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.155, v_num=0, train_loss=0.131, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.359, val_accuracy=0.878, val_f1_score=0.878]
Epoch 58:  91%|█████████ | 232/255 [01:30<00:09,  2.55it/s, loss=0.155, v_num=0, train_loss=0.131, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.359, val_accuracy=0.878, val_f1_score=0.878]
Epoch 58:  92%|█████████▏| 234/255 [01:31<00:08,  2.57it/s, loss=0.155, v_num=0, train_loss=0.131, train_accuracy=0

Epoch 58, global step 13333: val_loss reached 0.32503 (best 0.32372), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2-v1.ckpt" as top 2


Epoch 59:  89%|████████▊ | 226/255 [01:24<00:10,  2.69it/s, loss=0.183, v_num=0, train_loss=0.0404, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.325, val_accuracy=0.881, val_f1_score=0.881]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 59:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.183, v_num=0, train_loss=0.0404, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.325, val_accuracy=0.881, val_f1_score=0.881]
Epoch 59:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.183, v_num=0, train_loss=0.0404, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.325, val_accuracy=0.881, val_f1_score=0.881]
Epoch 59:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.183, v_num=0, train_loss=0.0404, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.325, val_accuracy=0.881, val_f1_score=0.881]
Epoch 59:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.183, v_num=0, train_loss=0.0404, train_accura

Epoch 59, global step 13559: val_loss was not in top 2


Epoch 60:  89%|████████▊ | 226/255 [01:24<00:10,  2.69it/s, loss=0.181, v_num=0, train_loss=0.234, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.523, val_accuracy=0.865, val_f1_score=0.865] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 60:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.181, v_num=0, train_loss=0.234, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.523, val_accuracy=0.865, val_f1_score=0.865]
Epoch 60:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.181, v_num=0, train_loss=0.234, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.523, val_accuracy=0.865, val_f1_score=0.865]
Epoch 60:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.181, v_num=0, train_loss=0.234, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.523, val_accuracy=0.865, val_f1_score=0.865]
Epoch 60:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.181, v_num=0, train_loss=0.234, train_accuracy=0

Epoch 60, global step 13785: val_loss reached 0.31470 (best 0.31470), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2-v1.ckpt" as top 2


Epoch 61:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.148, v_num=0, train_loss=0.0324, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.315, val_accuracy=0.886, val_f1_score=0.886]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 61:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.148, v_num=0, train_loss=0.0324, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.315, val_accuracy=0.886, val_f1_score=0.886]
Epoch 61:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.148, v_num=0, train_loss=0.0324, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.315, val_accuracy=0.886, val_f1_score=0.886]
Validating:  14%|█▍        | 4/29 [00:06<00:24,  1.04it/s][A
Epoch 61:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.148, v_num=0, train_loss=0.0324, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.315, val_accuracy=0.886, val_f1_score=0.886]
Epoch 61:  92%|█████████▏| 234/255 [01:30<00:08,  

Epoch 61, global step 14011: val_loss was not in top 2


Epoch 62:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.141, v_num=0, train_loss=0.0789, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.368, val_accuracy=0.885, val_f1_score=0.885]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 62:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.141, v_num=0, train_loss=0.0789, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.368, val_accuracy=0.885, val_f1_score=0.885]
Epoch 62:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.141, v_num=0, train_loss=0.0789, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.368, val_accuracy=0.885, val_f1_score=0.885]
Epoch 62:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.141, v_num=0, train_loss=0.0789, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.368, val_accuracy=0.885, val_f1_score=0.885]
Epoch 62:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.141, v_num=0, train_loss=0.0789, train_accura

Epoch 62, global step 14237: val_loss was not in top 2


Epoch 63:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.184, v_num=0, train_loss=0.312, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.324, val_accuracy=0.884, val_f1_score=0.884] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 63:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.184, v_num=0, train_loss=0.312, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.324, val_accuracy=0.884, val_f1_score=0.884]
Epoch 63:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.184, v_num=0, train_loss=0.312, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.324, val_accuracy=0.884, val_f1_score=0.884]
Epoch 63:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.184, v_num=0, train_loss=0.312, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.324, val_accuracy=0.884, val_f1_score=0.884]
Epoch 63:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.184, v_num=0, train_loss=0.312, train_accuracy=0

Epoch 63, global step 14463: val_loss reached 0.28561 (best 0.28561), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2.ckpt" as top 2


Epoch 64:  89%|████████▊ | 226/255 [01:24<00:10,  2.69it/s, loss=0.181, v_num=0, train_loss=0.107, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.286, val_accuracy=0.881, val_f1_score=0.881] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 64:  89%|████████▉ | 228/255 [01:29<00:10,  2.53it/s, loss=0.181, v_num=0, train_loss=0.107, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.286, val_accuracy=0.881, val_f1_score=0.881]
Epoch 64:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.181, v_num=0, train_loss=0.107, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.286, val_accuracy=0.881, val_f1_score=0.881]
Epoch 64:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.181, v_num=0, train_loss=0.107, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.286, val_accuracy=0.881, val_f1_score=0.881]
Epoch 64:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.181, v_num=0, train_loss=0.107, train_accuracy=1

Epoch 64, global step 14689: val_loss was not in top 2


Epoch 65:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.278, v_num=0, train_loss=0.152, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.329, val_accuracy=0.874, val_f1_score=0.874] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 65:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.278, v_num=0, train_loss=0.152, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.329, val_accuracy=0.874, val_f1_score=0.874]
Epoch 65:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.278, v_num=0, train_loss=0.152, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.329, val_accuracy=0.874, val_f1_score=0.874]
Epoch 65:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.278, v_num=0, train_loss=0.152, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.329, val_accuracy=0.874, val_f1_score=0.874]
Epoch 65:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.278, v_num=0, train_loss=0.152, train_accuracy=0

Epoch 65, global step 14915: val_loss was not in top 2


Epoch 66:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.198, v_num=0, train_loss=0.229, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.565, val_accuracy=0.821, val_f1_score=0.821] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 66:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.198, v_num=0, train_loss=0.229, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.565, val_accuracy=0.821, val_f1_score=0.821]
Epoch 66:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.198, v_num=0, train_loss=0.229, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.565, val_accuracy=0.821, val_f1_score=0.821]
Epoch 66:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.198, v_num=0, train_loss=0.229, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.565, val_accuracy=0.821, val_f1_score=0.821]
Epoch 66:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.198, v_num=0, train_loss=0.229, train_accuracy=0

Epoch 66, global step 15141: val_loss was not in top 2


Epoch 67:  89%|████████▊ | 226/255 [01:24<00:10,  2.69it/s, loss=0.139, v_num=0, train_loss=0.0787, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.363, val_accuracy=0.867, val_f1_score=0.867]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 67:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.139, v_num=0, train_loss=0.0787, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.363, val_accuracy=0.867, val_f1_score=0.867]
Epoch 67:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.139, v_num=0, train_loss=0.0787, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.363, val_accuracy=0.867, val_f1_score=0.867]
Epoch 67:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.139, v_num=0, train_loss=0.0787, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.363, val_accuracy=0.867, val_f1_score=0.867]
Epoch 67:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.139, v_num=0, train_loss=0.0787, train_accura

Epoch 67, global step 15367: val_loss was not in top 2


Epoch 68:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.24, v_num=0, train_loss=0.0649, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.371, val_accuracy=0.875, val_f1_score=0.875] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 68:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.24, v_num=0, train_loss=0.0649, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.371, val_accuracy=0.875, val_f1_score=0.875]
Epoch 68:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.24, v_num=0, train_loss=0.0649, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.371, val_accuracy=0.875, val_f1_score=0.875]
Epoch 68:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.24, v_num=0, train_loss=0.0649, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.371, val_accuracy=0.875, val_f1_score=0.875]
Epoch 68:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.24, v_num=0, train_loss=0.0649, train_accuracy=0

Epoch 68, global step 15593: val_loss was not in top 2


Epoch 69:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.159, v_num=0, train_loss=0.254, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.407, val_accuracy=0.867, val_f1_score=0.867] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 69:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.159, v_num=0, train_loss=0.254, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.407, val_accuracy=0.867, val_f1_score=0.867]
Epoch 69:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.159, v_num=0, train_loss=0.254, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.407, val_accuracy=0.867, val_f1_score=0.867]
Epoch 69:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.159, v_num=0, train_loss=0.254, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.407, val_accuracy=0.867, val_f1_score=0.867]
Epoch 69:  92%|█████████▏| 234/255 [01:30<00:08,  2.57it/s, loss=0.159, v_num=0, train_loss=0.254, train_accuracy=0

Epoch 69, global step 15819: val_loss was not in top 2


Epoch 70:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.132, v_num=0, train_loss=0.0258, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.368, val_accuracy=0.877, val_f1_score=0.877]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 70:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.132, v_num=0, train_loss=0.0258, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.368, val_accuracy=0.877, val_f1_score=0.877]
Epoch 70:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.132, v_num=0, train_loss=0.0258, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.368, val_accuracy=0.877, val_f1_score=0.877]
Epoch 70:  91%|█████████ | 232/255 [01:30<00:09,  2.55it/s, loss=0.132, v_num=0, train_loss=0.0258, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.368, val_accuracy=0.877, val_f1_score=0.877]
Epoch 70:  92%|█████████▏| 234/255 [01:31<00:08,  2.57it/s, loss=0.132, v_num=0, train_loss=0.0258, train_accura

Epoch 70, global step 16045: val_loss was not in top 2


Epoch 71:  89%|████████▊ | 226/255 [01:24<00:10,  2.69it/s, loss=0.143, v_num=0, train_loss=0.0496, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.426, val_accuracy=0.874, val_f1_score=0.874]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 71:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.143, v_num=0, train_loss=0.0496, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.426, val_accuracy=0.874, val_f1_score=0.874]
Epoch 71:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.143, v_num=0, train_loss=0.0496, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.426, val_accuracy=0.874, val_f1_score=0.874]
Epoch 71:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.143, v_num=0, train_loss=0.0496, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.426, val_accuracy=0.874, val_f1_score=0.874]
Epoch 71:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.143, v_num=0, train_loss=0.0496, train_accura

Epoch 71, global step 16271: val_loss was not in top 2


Epoch 72:  89%|████████▊ | 226/255 [01:24<00:10,  2.67it/s, loss=0.184, v_num=0, train_loss=0.141, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.497, val_accuracy=0.857, val_f1_score=0.857] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 72:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.184, v_num=0, train_loss=0.141, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.497, val_accuracy=0.857, val_f1_score=0.857]
Epoch 72:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.184, v_num=0, train_loss=0.141, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.497, val_accuracy=0.857, val_f1_score=0.857]
Epoch 72:  91%|█████████ | 232/255 [01:30<00:09,  2.55it/s, loss=0.184, v_num=0, train_loss=0.141, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.497, val_accuracy=0.857, val_f1_score=0.857]
Epoch 72:  92%|█████████▏| 234/255 [01:31<00:08,  2.57it/s, loss=0.184, v_num=0, train_loss=0.141, train_accuracy=0

Epoch 72, global step 16497: val_loss was not in top 2


Epoch 73:  89%|████████▊ | 226/255 [01:24<00:10,  2.67it/s, loss=0.163, v_num=0, train_loss=0.152, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.393, val_accuracy=0.864, val_f1_score=0.864] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 73:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.163, v_num=0, train_loss=0.152, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.393, val_accuracy=0.864, val_f1_score=0.864]
Epoch 73:  90%|█████████ | 230/255 [01:30<00:09,  2.53it/s, loss=0.163, v_num=0, train_loss=0.152, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.393, val_accuracy=0.864, val_f1_score=0.864]
Epoch 73:  91%|█████████ | 232/255 [01:30<00:09,  2.55it/s, loss=0.163, v_num=0, train_loss=0.152, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.393, val_accuracy=0.864, val_f1_score=0.864]
Epoch 73:  92%|█████████▏| 234/255 [01:31<00:08,  2.57it/s, loss=0.163, v_num=0, train_loss=0.152, train_accuracy=1

Epoch 73, global step 16723: val_loss reached 0.29068 (best 0.28561), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2-v1.ckpt" as top 2


Epoch 74:  89%|████████▊ | 226/255 [01:24<00:10,  2.67it/s, loss=0.139, v_num=0, train_loss=0.146, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.291, val_accuracy=0.890, val_f1_score=0.890] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 74:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.139, v_num=0, train_loss=0.146, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.291, val_accuracy=0.890, val_f1_score=0.890]
Epoch 74:  90%|█████████ | 230/255 [01:30<00:09,  2.53it/s, loss=0.139, v_num=0, train_loss=0.146, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.291, val_accuracy=0.890, val_f1_score=0.890]
Epoch 74:  91%|█████████ | 232/255 [01:30<00:09,  2.55it/s, loss=0.139, v_num=0, train_loss=0.146, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.291, val_accuracy=0.890, val_f1_score=0.890]
Epoch 74:  92%|█████████▏| 234/255 [01:31<00:08,  2.57it/s, loss=0.139, v_num=0, train_loss=0.146, train_accuracy=0

Epoch 74, global step 16949: val_loss was not in top 2


Epoch 75:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.163, v_num=0, train_loss=0.135, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.305, val_accuracy=0.895, val_f1_score=0.895] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 75:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.163, v_num=0, train_loss=0.135, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.305, val_accuracy=0.895, val_f1_score=0.895]
Epoch 75:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.163, v_num=0, train_loss=0.135, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.305, val_accuracy=0.895, val_f1_score=0.895]
Epoch 75:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.163, v_num=0, train_loss=0.135, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.305, val_accuracy=0.895, val_f1_score=0.895]
Epoch 75:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.163, v_num=0, train_loss=0.135, train_accuracy=0

Epoch 75, global step 17175: val_loss was not in top 2


Epoch 76:  89%|████████▊ | 226/255 [01:24<00:10,  2.69it/s, loss=0.161, v_num=0, train_loss=0.0564, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.314, val_accuracy=0.891, val_f1_score=0.891]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 76:  89%|████████▉ | 228/255 [01:29<00:10,  2.53it/s, loss=0.161, v_num=0, train_loss=0.0564, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.314, val_accuracy=0.891, val_f1_score=0.891]
Epoch 76:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.161, v_num=0, train_loss=0.0564, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.314, val_accuracy=0.891, val_f1_score=0.891]
Epoch 76:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.161, v_num=0, train_loss=0.0564, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.314, val_accuracy=0.891, val_f1_score=0.891]
Epoch 76:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.161, v_num=0, train_loss=0.0564, train_accura

Epoch 76, global step 17401: val_loss was not in top 2


Epoch 77:  89%|████████▊ | 226/255 [01:24<00:10,  2.66it/s, loss=0.104, v_num=0, train_loss=0.0478, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.356, val_accuracy=0.887, val_f1_score=0.887]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 77:  89%|████████▉ | 228/255 [01:30<00:10,  2.51it/s, loss=0.104, v_num=0, train_loss=0.0478, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.356, val_accuracy=0.887, val_f1_score=0.887]
Epoch 77:  90%|█████████ | 230/255 [01:30<00:09,  2.53it/s, loss=0.104, v_num=0, train_loss=0.0478, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.356, val_accuracy=0.887, val_f1_score=0.887]
Epoch 77:  91%|█████████ | 232/255 [01:31<00:09,  2.55it/s, loss=0.104, v_num=0, train_loss=0.0478, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.356, val_accuracy=0.887, val_f1_score=0.887]
Epoch 77:  92%|█████████▏| 234/255 [01:31<00:08,  2.56it/s, loss=0.104, v_num=0, train_loss=0.0478, train_accura

Epoch 77, global step 17627: val_loss was not in top 2


Epoch 78:  89%|████████▊ | 226/255 [01:23<00:10,  2.69it/s, loss=0.154, v_num=0, train_loss=0.0515, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.327, val_accuracy=0.904, val_f1_score=0.904]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 78:  89%|████████▉ | 228/255 [01:29<00:10,  2.54it/s, loss=0.154, v_num=0, train_loss=0.0515, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.327, val_accuracy=0.904, val_f1_score=0.904]
Epoch 78:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.154, v_num=0, train_loss=0.0515, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.327, val_accuracy=0.904, val_f1_score=0.904]
Epoch 78:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.154, v_num=0, train_loss=0.0515, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.327, val_accuracy=0.904, val_f1_score=0.904]
Epoch 78:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.154, v_num=0, train_loss=0.0515, train_accura

Epoch 78, global step 17853: val_loss was not in top 2


Epoch 79:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.167, v_num=0, train_loss=0.123, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.342, val_accuracy=0.888, val_f1_score=0.888] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 79:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.167, v_num=0, train_loss=0.123, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.342, val_accuracy=0.888, val_f1_score=0.888]
Epoch 79:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.167, v_num=0, train_loss=0.123, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.342, val_accuracy=0.888, val_f1_score=0.888]
Epoch 79:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.167, v_num=0, train_loss=0.123, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.342, val_accuracy=0.888, val_f1_score=0.888]
Epoch 79:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.167, v_num=0, train_loss=0.123, train_accuracy=0

Epoch 79, global step 18079: val_loss reached 0.27609 (best 0.27609), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2-v1.ckpt" as top 2


Epoch 80:  89%|████████▊ | 226/255 [01:23<00:10,  2.70it/s, loss=0.178, v_num=0, train_loss=0.222, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.276, val_accuracy=0.891, val_f1_score=0.891] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 80:  89%|████████▉ | 228/255 [01:29<00:10,  2.54it/s, loss=0.178, v_num=0, train_loss=0.222, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.276, val_accuracy=0.891, val_f1_score=0.891]
Epoch 80:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.178, v_num=0, train_loss=0.222, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.276, val_accuracy=0.891, val_f1_score=0.891]
Epoch 80:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.178, v_num=0, train_loss=0.222, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.276, val_accuracy=0.891, val_f1_score=0.891]
Epoch 80:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.178, v_num=0, train_loss=0.222, train_accuracy=0

Epoch 80, global step 18305: val_loss reached 0.28363 (best 0.27609), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2.ckpt" as top 2


Epoch 81:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.128, v_num=0, train_loss=0.228, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.284, val_accuracy=0.888, val_f1_score=0.888] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 81:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.128, v_num=0, train_loss=0.228, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.284, val_accuracy=0.888, val_f1_score=0.888]
Epoch 81:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.128, v_num=0, train_loss=0.228, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.284, val_accuracy=0.888, val_f1_score=0.888]
Epoch 81:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.128, v_num=0, train_loss=0.228, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.284, val_accuracy=0.888, val_f1_score=0.888]
Epoch 81:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.128, v_num=0, train_loss=0.228, train_accuracy=0

Epoch 81, global step 18531: val_loss was not in top 2


Epoch 82:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.16, v_num=0, train_loss=0.0408, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.315, val_accuracy=0.899, val_f1_score=0.899] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 82:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.16, v_num=0, train_loss=0.0408, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.315, val_accuracy=0.899, val_f1_score=0.899]
Epoch 82:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.16, v_num=0, train_loss=0.0408, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.315, val_accuracy=0.899, val_f1_score=0.899]
Epoch 82:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.16, v_num=0, train_loss=0.0408, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.315, val_accuracy=0.899, val_f1_score=0.899]
Epoch 82:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.16, v_num=0, train_loss=0.0408, train_accuracy=1

Epoch 82, global step 18757: val_loss was not in top 2


Epoch 83:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.153, v_num=0, train_loss=0.184, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.302, val_accuracy=0.899, val_f1_score=0.899] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 83:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.153, v_num=0, train_loss=0.184, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.302, val_accuracy=0.899, val_f1_score=0.899]
Epoch 83:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.153, v_num=0, train_loss=0.184, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.302, val_accuracy=0.899, val_f1_score=0.899]
Epoch 83:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.153, v_num=0, train_loss=0.184, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.302, val_accuracy=0.899, val_f1_score=0.899]
Epoch 83:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.153, v_num=0, train_loss=0.184, train_accuracy=0

Epoch 83, global step 18983: val_loss was not in top 2


Epoch 84:  89%|████████▊ | 226/255 [01:24<00:10,  2.69it/s, loss=0.141, v_num=0, train_loss=0.0489, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.316, val_accuracy=0.901, val_f1_score=0.901]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 84:  89%|████████▉ | 228/255 [01:29<00:10,  2.54it/s, loss=0.141, v_num=0, train_loss=0.0489, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.316, val_accuracy=0.901, val_f1_score=0.901]
Epoch 84:  90%|█████████ | 230/255 [01:29<00:09,  2.56it/s, loss=0.141, v_num=0, train_loss=0.0489, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.316, val_accuracy=0.901, val_f1_score=0.901]
Epoch 84:  91%|█████████ | 232/255 [01:30<00:08,  2.58it/s, loss=0.141, v_num=0, train_loss=0.0489, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.316, val_accuracy=0.901, val_f1_score=0.901]
Epoch 84:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.141, v_num=0, train_loss=0.0489, train_accura

Epoch 84, global step 19209: val_loss reached 0.27646 (best 0.27609), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2.ckpt" as top 2


Epoch 85:  89%|████████▊ | 226/255 [01:23<00:10,  2.69it/s, loss=0.126, v_num=0, train_loss=0.0389, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.276, val_accuracy=0.911, val_f1_score=0.911]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 85:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.126, v_num=0, train_loss=0.0389, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.276, val_accuracy=0.911, val_f1_score=0.911]
Epoch 85:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.126, v_num=0, train_loss=0.0389, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.276, val_accuracy=0.911, val_f1_score=0.911]
Epoch 85:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.126, v_num=0, train_loss=0.0389, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.276, val_accuracy=0.911, val_f1_score=0.911]
Epoch 85:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.126, v_num=0, train_loss=0.0389, train_accura

Epoch 85, global step 19435: val_loss was not in top 2


Epoch 86:  89%|████████▊ | 226/255 [01:24<00:10,  2.69it/s, loss=0.117, v_num=0, train_loss=0.0625, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.347, val_accuracy=0.877, val_f1_score=0.877]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 86:  89%|████████▉ | 228/255 [01:29<00:10,  2.54it/s, loss=0.117, v_num=0, train_loss=0.0625, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.347, val_accuracy=0.877, val_f1_score=0.877]
Epoch 86:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.117, v_num=0, train_loss=0.0625, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.347, val_accuracy=0.877, val_f1_score=0.877]
Epoch 86:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.117, v_num=0, train_loss=0.0625, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.347, val_accuracy=0.877, val_f1_score=0.877]
Epoch 86:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.117, v_num=0, train_loss=0.0625, train_accura

Epoch 86, global step 19661: val_loss was not in top 2


Epoch 87:  89%|████████▊ | 226/255 [01:24<00:10,  2.69it/s, loss=0.138, v_num=0, train_loss=0.0893, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.308, val_accuracy=0.899, val_f1_score=0.899]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 87:  89%|████████▉ | 228/255 [01:29<00:10,  2.54it/s, loss=0.138, v_num=0, train_loss=0.0893, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.308, val_accuracy=0.899, val_f1_score=0.899]
Epoch 87:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.138, v_num=0, train_loss=0.0893, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.308, val_accuracy=0.899, val_f1_score=0.899]
Epoch 87:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.138, v_num=0, train_loss=0.0893, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.308, val_accuracy=0.899, val_f1_score=0.899]
Epoch 87:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.138, v_num=0, train_loss=0.0893, train_accura

Epoch 87, global step 19887: val_loss reached 0.24675 (best 0.24675), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2.ckpt" as top 2


Epoch 88:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.113, v_num=0, train_loss=0.0149, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.247, val_accuracy=0.899, val_f1_score=0.899]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 88:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.113, v_num=0, train_loss=0.0149, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.247, val_accuracy=0.899, val_f1_score=0.899]
Epoch 88:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.113, v_num=0, train_loss=0.0149, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.247, val_accuracy=0.899, val_f1_score=0.899]
Epoch 88:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.113, v_num=0, train_loss=0.0149, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.247, val_accuracy=0.899, val_f1_score=0.899]
Epoch 88:  92%|█████████▏| 234/255 [01:30<00:08,  2.57it/s, loss=0.113, v_num=0, train_loss=0.0149, train_accura

Epoch 88, global step 20113: val_loss reached 0.25980 (best 0.24675), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2-v1.ckpt" as top 2


Epoch 89:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.14, v_num=0, train_loss=0.235, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.260, val_accuracy=0.908, val_f1_score=0.908]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 89:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.14, v_num=0, train_loss=0.235, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.260, val_accuracy=0.908, val_f1_score=0.908]
Epoch 89:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.14, v_num=0, train_loss=0.235, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.260, val_accuracy=0.908, val_f1_score=0.908]
Epoch 89:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.14, v_num=0, train_loss=0.235, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.260, val_accuracy=0.908, val_f1_score=0.908]
Epoch 89:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.14, v_num=0, train_loss=0.235, train_accuracy=0.88

Epoch 89, global step 20339: val_loss was not in top 2


Epoch 90:  89%|████████▊ | 226/255 [01:24<00:10,  2.69it/s, loss=0.0737, v_num=0, train_loss=0.142, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.270, val_accuracy=0.909, val_f1_score=0.909] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 90:  89%|████████▉ | 228/255 [01:29<00:10,  2.53it/s, loss=0.0737, v_num=0, train_loss=0.142, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.270, val_accuracy=0.909, val_f1_score=0.909]
Validating:   7%|▋         | 2/29 [00:05<01:06,  2.46s/it][A
Epoch 90:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.0737, v_num=0, train_loss=0.142, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.270, val_accuracy=0.909, val_f1_score=0.909]
Epoch 90:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.0737, v_num=0, train_loss=0.142, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.270, val_accuracy=0.909, val_f1_score=0.909]
Epoch 90:  92%|█████████▏| 234/255 [01:30<00:08, 

Epoch 90, global step 20565: val_loss was not in top 2


Epoch 91:  89%|████████▊ | 226/255 [01:24<00:10,  2.69it/s, loss=0.0782, v_num=0, train_loss=0.0548, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.338, val_accuracy=0.894, val_f1_score=0.894]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 91:  89%|████████▉ | 228/255 [01:29<00:10,  2.53it/s, loss=0.0782, v_num=0, train_loss=0.0548, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.338, val_accuracy=0.894, val_f1_score=0.894]
Epoch 91:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.0782, v_num=0, train_loss=0.0548, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.338, val_accuracy=0.894, val_f1_score=0.894]
Epoch 91:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.0782, v_num=0, train_loss=0.0548, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.338, val_accuracy=0.894, val_f1_score=0.894]
Validating:  21%|██        | 6/29 [00:06<00:12,  1.81it/s][A
Epoch 91:  92%|█████████▏| 234/255 [01:30<00:0

Epoch 91, global step 20791: val_loss was not in top 2


Epoch 92:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.0874, v_num=0, train_loss=0.0866, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.291, val_accuracy=0.904, val_f1_score=0.904] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 92:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.0874, v_num=0, train_loss=0.0866, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.291, val_accuracy=0.904, val_f1_score=0.904]
Epoch 92:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.0874, v_num=0, train_loss=0.0866, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.291, val_accuracy=0.904, val_f1_score=0.904]
Epoch 92:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.0874, v_num=0, train_loss=0.0866, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.291, val_accuracy=0.904, val_f1_score=0.904]
Epoch 92:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.0874, v_num=0, train_loss=0.0866, train_

Epoch 92, global step 21017: val_loss was not in top 2


Epoch 93:  89%|████████▊ | 226/255 [01:24<00:10,  2.69it/s, loss=0.121, v_num=0, train_loss=0.148, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.283, val_accuracy=0.910, val_f1_score=0.910]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 93:  89%|████████▉ | 228/255 [01:29<00:10,  2.53it/s, loss=0.121, v_num=0, train_loss=0.148, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.283, val_accuracy=0.910, val_f1_score=0.910]
Epoch 93:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.121, v_num=0, train_loss=0.148, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.283, val_accuracy=0.910, val_f1_score=0.910]
Epoch 93:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.121, v_num=0, train_loss=0.148, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.283, val_accuracy=0.910, val_f1_score=0.910]
Epoch 93:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.121, v_num=0, train_loss=0.148, train_accuracy

Epoch 93, global step 21243: val_loss was not in top 2


Epoch 94:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.108, v_num=0, train_loss=0.0367, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.297, val_accuracy=0.911, val_f1_score=0.911]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 94:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.108, v_num=0, train_loss=0.0367, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.297, val_accuracy=0.911, val_f1_score=0.911]
Epoch 94:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.108, v_num=0, train_loss=0.0367, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.297, val_accuracy=0.911, val_f1_score=0.911]
Epoch 94:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.108, v_num=0, train_loss=0.0367, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.297, val_accuracy=0.911, val_f1_score=0.911]
Epoch 94:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.108, v_num=0, train_loss=0.0367, train_accura

Epoch 94, global step 21469: val_loss was not in top 2


Epoch 95:  89%|████████▊ | 226/255 [01:24<00:10,  2.69it/s, loss=0.136, v_num=0, train_loss=0.170, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.287, val_accuracy=0.909, val_f1_score=0.909]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 95:  89%|████████▉ | 228/255 [01:29<00:10,  2.54it/s, loss=0.136, v_num=0, train_loss=0.170, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.287, val_accuracy=0.909, val_f1_score=0.909]
Epoch 95:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.136, v_num=0, train_loss=0.170, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.287, val_accuracy=0.909, val_f1_score=0.909]
Epoch 95:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.136, v_num=0, train_loss=0.170, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.287, val_accuracy=0.909, val_f1_score=0.909]
Epoch 95:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.136, v_num=0, train_loss=0.170, train_accuracy=

Epoch 95, global step 21695: val_loss was not in top 2


Epoch 96:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.147, v_num=0, train_loss=0.025, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.276, val_accuracy=0.906, val_f1_score=0.906] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 96:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.147, v_num=0, train_loss=0.025, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.276, val_accuracy=0.906, val_f1_score=0.906]
Epoch 96:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.147, v_num=0, train_loss=0.025, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.276, val_accuracy=0.906, val_f1_score=0.906]
Epoch 96:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.147, v_num=0, train_loss=0.025, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.276, val_accuracy=0.906, val_f1_score=0.906]
Epoch 96:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.147, v_num=0, train_loss=0.025, train_accuracy=1

Epoch 96, global step 21921: val_loss was not in top 2


Epoch 97:  89%|████████▊ | 226/255 [01:24<00:10,  2.69it/s, loss=0.097, v_num=0, train_loss=0.0251, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.275, val_accuracy=0.905, val_f1_score=0.905] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 97:  89%|████████▉ | 228/255 [01:29<00:10,  2.54it/s, loss=0.097, v_num=0, train_loss=0.0251, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.275, val_accuracy=0.905, val_f1_score=0.905]
Epoch 97:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.097, v_num=0, train_loss=0.0251, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.275, val_accuracy=0.905, val_f1_score=0.905]
Epoch 97:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.097, v_num=0, train_loss=0.0251, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.275, val_accuracy=0.905, val_f1_score=0.905]
Epoch 97:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.097, v_num=0, train_loss=0.0251, train_accur

Epoch 97, global step 22147: val_loss was not in top 2


Epoch 98:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.204, v_num=0, train_loss=0.163, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.286, val_accuracy=0.914, val_f1_score=0.914] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 98:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.204, v_num=0, train_loss=0.163, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.286, val_accuracy=0.914, val_f1_score=0.914]
Epoch 98:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.204, v_num=0, train_loss=0.163, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.286, val_accuracy=0.914, val_f1_score=0.914]
Epoch 98:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.204, v_num=0, train_loss=0.163, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.286, val_accuracy=0.914, val_f1_score=0.914]
Epoch 98:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.204, v_num=0, train_loss=0.163, train_accuracy=0

Epoch 98, global step 22373: val_loss was not in top 2


Epoch 99:  89%|████████▊ | 226/255 [01:24<00:10,  2.66it/s, loss=0.163, v_num=0, train_loss=0.115, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.299, val_accuracy=0.883, val_f1_score=0.883] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 99:  89%|████████▉ | 228/255 [01:30<00:10,  2.51it/s, loss=0.163, v_num=0, train_loss=0.115, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.299, val_accuracy=0.883, val_f1_score=0.883]
Epoch 99:  90%|█████████ | 230/255 [01:30<00:09,  2.53it/s, loss=0.163, v_num=0, train_loss=0.115, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.299, val_accuracy=0.883, val_f1_score=0.883]
Epoch 99:  91%|█████████ | 232/255 [01:31<00:09,  2.55it/s, loss=0.163, v_num=0, train_loss=0.115, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.299, val_accuracy=0.883, val_f1_score=0.883]
Epoch 99:  92%|█████████▏| 234/255 [01:31<00:08,  2.56it/s, loss=0.163, v_num=0, train_loss=0.115, train_accuracy=1

Epoch 99, global step 22599: val_loss was not in top 2


Epoch 100:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.163, v_num=0, train_loss=0.182, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.307, val_accuracy=0.878, val_f1_score=0.878] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 100:  89%|████████▉ | 228/255 [01:31<00:10,  2.50it/s, loss=0.163, v_num=0, train_loss=0.182, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.307, val_accuracy=0.878, val_f1_score=0.878]
Epoch 100:  90%|█████████ | 230/255 [01:31<00:09,  2.52it/s, loss=0.163, v_num=0, train_loss=0.182, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.307, val_accuracy=0.878, val_f1_score=0.878]
Epoch 100:  91%|█████████ | 232/255 [01:31<00:09,  2.53it/s, loss=0.163, v_num=0, train_loss=0.182, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.307, val_accuracy=0.878, val_f1_score=0.878]
Epoch 100:  92%|█████████▏| 234/255 [01:31<00:08,  2.55it/s, loss=0.163, v_num=0, train_loss=0.182, train_accur

Epoch 100, global step 22825: val_loss was not in top 2


Epoch 101:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.142, v_num=0, train_loss=0.114, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.335, val_accuracy=0.889, val_f1_score=0.889] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 101:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.142, v_num=0, train_loss=0.114, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.335, val_accuracy=0.889, val_f1_score=0.889]
Epoch 101:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.142, v_num=0, train_loss=0.114, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.335, val_accuracy=0.889, val_f1_score=0.889]
Epoch 101:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.142, v_num=0, train_loss=0.114, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.335, val_accuracy=0.889, val_f1_score=0.889]
Epoch 101:  92%|█████████▏| 234/255 [01:30<00:08,  2.57it/s, loss=0.142, v_num=0, train_loss=0.114, train_accur

Epoch 101, global step 23051: val_loss was not in top 2


Epoch 102:  89%|████████▊ | 226/255 [01:24<00:10,  2.67it/s, loss=0.309, v_num=0, train_loss=0.568, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.346, val_accuracy=0.879, val_f1_score=0.879]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 102:  89%|████████▉ | 228/255 [01:30<00:10,  2.51it/s, loss=0.309, v_num=0, train_loss=0.568, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.346, val_accuracy=0.879, val_f1_score=0.879]
Epoch 102:  90%|█████████ | 230/255 [01:30<00:09,  2.53it/s, loss=0.309, v_num=0, train_loss=0.568, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.346, val_accuracy=0.879, val_f1_score=0.879]
Epoch 102:  91%|█████████ | 232/255 [01:31<00:09,  2.55it/s, loss=0.309, v_num=0, train_loss=0.568, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.346, val_accuracy=0.879, val_f1_score=0.879]
Epoch 102:  92%|█████████▏| 234/255 [01:31<00:08,  2.57it/s, loss=0.309, v_num=0, train_loss=0.568, train_accura

Epoch 102, global step 23277: val_loss was not in top 2


Epoch 103:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.222, v_num=0, train_loss=0.243, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.431, val_accuracy=0.830, val_f1_score=0.830] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 103:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.222, v_num=0, train_loss=0.243, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.431, val_accuracy=0.830, val_f1_score=0.830]
Epoch 103:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.222, v_num=0, train_loss=0.243, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.431, val_accuracy=0.830, val_f1_score=0.830]
Epoch 103:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.222, v_num=0, train_loss=0.243, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.431, val_accuracy=0.830, val_f1_score=0.830]
Epoch 103:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.222, v_num=0, train_loss=0.243, train_accur

Epoch 103, global step 23503: val_loss was not in top 2


Epoch 104:  89%|████████▊ | 226/255 [01:24<00:10,  2.69it/s, loss=0.183, v_num=0, train_loss=0.0766, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.418, val_accuracy=0.854, val_f1_score=0.854]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 104:  89%|████████▉ | 228/255 [01:29<00:10,  2.54it/s, loss=0.183, v_num=0, train_loss=0.0766, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.418, val_accuracy=0.854, val_f1_score=0.854]
Epoch 104:  90%|█████████ | 230/255 [01:30<00:09,  2.56it/s, loss=0.183, v_num=0, train_loss=0.0766, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.418, val_accuracy=0.854, val_f1_score=0.854]
Epoch 104:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.183, v_num=0, train_loss=0.0766, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.418, val_accuracy=0.854, val_f1_score=0.854]
Epoch 104:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.183, v_num=0, train_loss=0.0766, train_a

Epoch 104, global step 23729: val_loss was not in top 2


Epoch 105:  89%|████████▊ | 226/255 [01:23<00:10,  2.69it/s, loss=0.119, v_num=0, train_loss=0.172, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.354, val_accuracy=0.881, val_f1_score=0.881] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 105:  89%|████████▉ | 228/255 [01:29<00:10,  2.54it/s, loss=0.119, v_num=0, train_loss=0.172, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.354, val_accuracy=0.881, val_f1_score=0.881]
Epoch 105:  90%|█████████ | 230/255 [01:29<00:09,  2.56it/s, loss=0.119, v_num=0, train_loss=0.172, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.354, val_accuracy=0.881, val_f1_score=0.881]
Epoch 105:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.119, v_num=0, train_loss=0.172, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.354, val_accuracy=0.881, val_f1_score=0.881]
Epoch 105:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.119, v_num=0, train_loss=0.172, train_accur

Epoch 105, global step 23955: val_loss was not in top 2


Epoch 106:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.142, v_num=0, train_loss=0.106, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.324, val_accuracy=0.895, val_f1_score=0.895] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 106:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.142, v_num=0, train_loss=0.106, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.324, val_accuracy=0.895, val_f1_score=0.895]
Epoch 106:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.142, v_num=0, train_loss=0.106, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.324, val_accuracy=0.895, val_f1_score=0.895]
Epoch 106:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.142, v_num=0, train_loss=0.106, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.324, val_accuracy=0.895, val_f1_score=0.895]
Epoch 106:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.142, v_num=0, train_loss=0.106, train_accur

Epoch 106, global step 24181: val_loss was not in top 2


Epoch 107:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.134, v_num=0, train_loss=0.0488, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.310, val_accuracy=0.884, val_f1_score=0.884]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 107:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.134, v_num=0, train_loss=0.0488, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.310, val_accuracy=0.884, val_f1_score=0.884]
Epoch 107:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.134, v_num=0, train_loss=0.0488, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.310, val_accuracy=0.884, val_f1_score=0.884]
Epoch 107:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.134, v_num=0, train_loss=0.0488, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.310, val_accuracy=0.884, val_f1_score=0.884]
Epoch 107:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.134, v_num=0, train_loss=0.0488, train_a

Epoch 107, global step 24407: val_loss was not in top 2


Epoch 108:  89%|████████▊ | 226/255 [01:23<00:10,  2.69it/s, loss=0.13, v_num=0, train_loss=0.126, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.277, val_accuracy=0.900, val_f1_score=0.900]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 108:  89%|████████▉ | 228/255 [01:29<00:10,  2.54it/s, loss=0.13, v_num=0, train_loss=0.126, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.277, val_accuracy=0.900, val_f1_score=0.900]
Epoch 108:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.13, v_num=0, train_loss=0.126, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.277, val_accuracy=0.900, val_f1_score=0.900]
Epoch 108:  91%|█████████ | 232/255 [01:30<00:08,  2.57it/s, loss=0.13, v_num=0, train_loss=0.126, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.277, val_accuracy=0.900, val_f1_score=0.900]
Epoch 108:  92%|█████████▏| 234/255 [01:30<00:08,  2.59it/s, loss=0.13, v_num=0, train_loss=0.126, train_accuracy

Epoch 108, global step 24633: val_loss was not in top 2


Epoch 109:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.11, v_num=0, train_loss=0.059, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.326, val_accuracy=0.891, val_f1_score=0.891]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 109:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.11, v_num=0, train_loss=0.059, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.326, val_accuracy=0.891, val_f1_score=0.891]
Validating:   7%|▋         | 2/29 [00:06<01:08,  2.53s/it][A
Epoch 109:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.11, v_num=0, train_loss=0.059, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.326, val_accuracy=0.891, val_f1_score=0.891]
Epoch 109:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.11, v_num=0, train_loss=0.059, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.326, val_accuracy=0.891, val_f1_score=0.891]
Epoch 109:  92%|█████████▏| 234/255 [01:30<00:08,  

Epoch 109, global step 24859: val_loss was not in top 2


Epoch 110:  89%|████████▊ | 226/255 [01:24<00:10,  2.67it/s, loss=0.12, v_num=0, train_loss=0.0447, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.307, val_accuracy=0.904, val_f1_score=0.904]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 110:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.12, v_num=0, train_loss=0.0447, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.307, val_accuracy=0.904, val_f1_score=0.904]
Epoch 110:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.12, v_num=0, train_loss=0.0447, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.307, val_accuracy=0.904, val_f1_score=0.904]
Epoch 110:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.12, v_num=0, train_loss=0.0447, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.307, val_accuracy=0.904, val_f1_score=0.904]
Epoch 110:  92%|█████████▏| 234/255 [01:30<00:08,  2.57it/s, loss=0.12, v_num=0, train_loss=0.0447, train_accu

Epoch 110, global step 25085: val_loss was not in top 2


Epoch 111:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.122, v_num=0, train_loss=0.150, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.384, val_accuracy=0.883, val_f1_score=0.883] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 111:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.122, v_num=0, train_loss=0.150, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.384, val_accuracy=0.883, val_f1_score=0.883]
Epoch 111:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.122, v_num=0, train_loss=0.150, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.384, val_accuracy=0.883, val_f1_score=0.883]
Epoch 111:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.122, v_num=0, train_loss=0.150, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.384, val_accuracy=0.883, val_f1_score=0.883]
Epoch 111:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.122, v_num=0, train_loss=0.150, train_accur

Epoch 111, global step 25311: val_loss was not in top 2


Epoch 112:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.145, v_num=0, train_loss=0.0533, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.301, val_accuracy=0.901, val_f1_score=0.901]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 112:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.145, v_num=0, train_loss=0.0533, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.301, val_accuracy=0.901, val_f1_score=0.901]
Epoch 112:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.145, v_num=0, train_loss=0.0533, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.301, val_accuracy=0.901, val_f1_score=0.901]
Epoch 112:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.145, v_num=0, train_loss=0.0533, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.301, val_accuracy=0.901, val_f1_score=0.901]
Epoch 112:  92%|█████████▏| 234/255 [01:30<00:08,  2.57it/s, loss=0.145, v_num=0, train_loss=0.0533, train_a

Epoch 112, global step 25537: val_loss was not in top 2


Epoch 113:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.121, v_num=0, train_loss=0.142, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.291, val_accuracy=0.895, val_f1_score=0.895] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 113:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.121, v_num=0, train_loss=0.142, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.291, val_accuracy=0.895, val_f1_score=0.895]
Epoch 113:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.121, v_num=0, train_loss=0.142, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.291, val_accuracy=0.895, val_f1_score=0.895]
Epoch 113:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.121, v_num=0, train_loss=0.142, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.291, val_accuracy=0.895, val_f1_score=0.895]
Epoch 113:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.121, v_num=0, train_loss=0.142, train_accur

Epoch 113, global step 25763: val_loss was not in top 2


Epoch 114:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.121, v_num=0, train_loss=0.0698, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.313, val_accuracy=0.896, val_f1_score=0.896] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 114:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.121, v_num=0, train_loss=0.0698, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.313, val_accuracy=0.896, val_f1_score=0.896]
Epoch 114:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.121, v_num=0, train_loss=0.0698, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.313, val_accuracy=0.896, val_f1_score=0.896]
Epoch 114:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.121, v_num=0, train_loss=0.0698, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.313, val_accuracy=0.896, val_f1_score=0.896]
Epoch 114:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.121, v_num=0, train_loss=0.0698, train_

Epoch 114, global step 25989: val_loss was not in top 2


Epoch 115:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.0979, v_num=0, train_loss=0.0506, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.286, val_accuracy=0.894, val_f1_score=0.894]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 115:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.0979, v_num=0, train_loss=0.0506, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.286, val_accuracy=0.894, val_f1_score=0.894]
Epoch 115:  90%|█████████ | 230/255 [01:30<00:09,  2.53it/s, loss=0.0979, v_num=0, train_loss=0.0506, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.286, val_accuracy=0.894, val_f1_score=0.894]
Epoch 115:  91%|█████████ | 232/255 [01:30<00:09,  2.55it/s, loss=0.0979, v_num=0, train_loss=0.0506, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.286, val_accuracy=0.894, val_f1_score=0.894]
Epoch 115:  92%|█████████▏| 234/255 [01:31<00:08,  2.57it/s, loss=0.0979, v_num=0, train_loss=0.0506, tr

Epoch 115, global step 26215: val_loss was not in top 2


Epoch 116:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.13, v_num=0, train_loss=0.297, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.298, val_accuracy=0.903, val_f1_score=0.903]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 116:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.13, v_num=0, train_loss=0.297, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.298, val_accuracy=0.903, val_f1_score=0.903]
Epoch 116:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.13, v_num=0, train_loss=0.297, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.298, val_accuracy=0.903, val_f1_score=0.903]
Epoch 116:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.13, v_num=0, train_loss=0.297, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.298, val_accuracy=0.903, val_f1_score=0.903]
Epoch 116:  92%|█████████▏| 234/255 [01:30<00:08,  2.57it/s, loss=0.13, v_num=0, train_loss=0.297, train_accuracy

Epoch 116, global step 26441: val_loss was not in top 2


Epoch 117:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.198, v_num=0, train_loss=0.0909, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.349, val_accuracy=0.889, val_f1_score=0.889]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 117:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.198, v_num=0, train_loss=0.0909, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.349, val_accuracy=0.889, val_f1_score=0.889]
Validating:   7%|▋         | 2/29 [00:05<01:06,  2.45s/it][A
Epoch 117:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.198, v_num=0, train_loss=0.0909, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.349, val_accuracy=0.889, val_f1_score=0.889]
Epoch 117:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.198, v_num=0, train_loss=0.0909, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.349, val_accuracy=0.889, val_f1_score=0.889]
Epoch 117:  92%|█████████▏| 234/255 [01:30<00:

Epoch 117, global step 26667: val_loss was not in top 2


Epoch 118:  89%|████████▊ | 226/255 [01:24<00:10,  2.67it/s, loss=0.13, v_num=0, train_loss=0.134, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.315, val_accuracy=0.881, val_f1_score=0.881]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 118:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.13, v_num=0, train_loss=0.134, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.315, val_accuracy=0.881, val_f1_score=0.881]
Epoch 118:  90%|█████████ | 230/255 [01:30<00:09,  2.53it/s, loss=0.13, v_num=0, train_loss=0.134, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.315, val_accuracy=0.881, val_f1_score=0.881]
Epoch 118:  91%|█████████ | 232/255 [01:30<00:09,  2.55it/s, loss=0.13, v_num=0, train_loss=0.134, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.315, val_accuracy=0.881, val_f1_score=0.881]
Epoch 118:  92%|█████████▏| 234/255 [01:31<00:08,  2.57it/s, loss=0.13, v_num=0, train_loss=0.134, train_accuracy=

Epoch 118, global step 26893: val_loss was not in top 2


Epoch 119:  89%|████████▊ | 226/255 [01:24<00:10,  2.67it/s, loss=0.157, v_num=0, train_loss=0.0995, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.287, val_accuracy=0.895, val_f1_score=0.895]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 119:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.157, v_num=0, train_loss=0.0995, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.287, val_accuracy=0.895, val_f1_score=0.895]
Validating:   7%|▋         | 2/29 [00:05<01:06,  2.48s/it][A
Epoch 119:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.157, v_num=0, train_loss=0.0995, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.287, val_accuracy=0.895, val_f1_score=0.895]
Epoch 119:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.157, v_num=0, train_loss=0.0995, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.287, val_accuracy=0.895, val_f1_score=0.895]
Epoch 119:  92%|█████████▏| 234/255 [01:30<00:

Epoch 119, global step 27119: val_loss was not in top 2


Epoch 120:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.132, v_num=0, train_loss=0.319, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.356, val_accuracy=0.891, val_f1_score=0.891] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 120:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.132, v_num=0, train_loss=0.319, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.356, val_accuracy=0.891, val_f1_score=0.891]
Epoch 120:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.132, v_num=0, train_loss=0.319, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.356, val_accuracy=0.891, val_f1_score=0.891]
Epoch 120:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.132, v_num=0, train_loss=0.319, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.356, val_accuracy=0.891, val_f1_score=0.891]
Epoch 120:  92%|█████████▏| 234/255 [01:30<00:08,  2.57it/s, loss=0.132, v_num=0, train_loss=0.319, train_accur

Epoch 120, global step 27345: val_loss reached 0.25661 (best 0.24675), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2-v1.ckpt" as top 2


Epoch 121:  89%|████████▊ | 226/255 [01:24<00:10,  2.69it/s, loss=0.0968, v_num=0, train_loss=0.0211, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.257, val_accuracy=0.911, val_f1_score=0.911]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 121:  89%|████████▉ | 228/255 [01:30<00:10,  2.53it/s, loss=0.0968, v_num=0, train_loss=0.0211, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.257, val_accuracy=0.911, val_f1_score=0.911]
Epoch 121:  90%|█████████ | 230/255 [01:30<00:09,  2.55it/s, loss=0.0968, v_num=0, train_loss=0.0211, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.257, val_accuracy=0.911, val_f1_score=0.911]
Epoch 121:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.0968, v_num=0, train_loss=0.0211, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.257, val_accuracy=0.911, val_f1_score=0.911]
Epoch 121:  92%|█████████▏| 234/255 [01:30<00:08,  2.58it/s, loss=0.0968, v_num=0, train_loss=0.0211, tr

Epoch 121, global step 27571: val_loss was not in top 2


Epoch 122:  89%|████████▊ | 226/255 [01:24<00:10,  2.68it/s, loss=0.0965, v_num=0, train_loss=0.0828, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.297, val_accuracy=0.898, val_f1_score=0.898]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 122:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.0965, v_num=0, train_loss=0.0828, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.297, val_accuracy=0.898, val_f1_score=0.898]
Epoch 122:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.0965, v_num=0, train_loss=0.0828, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.297, val_accuracy=0.898, val_f1_score=0.898]
Epoch 122:  91%|█████████ | 232/255 [01:30<00:08,  2.56it/s, loss=0.0965, v_num=0, train_loss=0.0828, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.297, val_accuracy=0.898, val_f1_score=0.898]
Validating:  21%|██        | 6/29 [00:06<00:13,  1.67it/s][A
Epoch 122:  92%|█████████▏| 234/255 [01:30

Epoch 122, global step 27797: val_loss was not in top 2


Epoch 123:  89%|████████▊ | 226/255 [01:24<00:10,  2.67it/s, loss=0.118, v_num=0, train_loss=0.0469, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.288, val_accuracy=0.903, val_f1_score=0.903]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 123:  89%|████████▉ | 228/255 [01:30<00:10,  2.52it/s, loss=0.118, v_num=0, train_loss=0.0469, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.288, val_accuracy=0.903, val_f1_score=0.903]
Epoch 123:  90%|█████████ | 230/255 [01:30<00:09,  2.54it/s, loss=0.118, v_num=0, train_loss=0.0469, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.288, val_accuracy=0.903, val_f1_score=0.903]
Epoch 123:  91%|█████████ | 232/255 [01:30<00:09,  2.55it/s, loss=0.118, v_num=0, train_loss=0.0469, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.288, val_accuracy=0.903, val_f1_score=0.903]
Epoch 123:  92%|█████████▏| 234/255 [01:31<00:08,  2.57it/s, loss=0.118, v_num=0, train_loss=0.0469, train

Epoch 123, global step 28023: val_loss was not in top 2


Epoch 124:  89%|████████▊ | 226/255 [01:25<00:10,  2.65it/s, loss=0.114, v_num=0, train_loss=0.0704, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.318, val_accuracy=0.902, val_f1_score=0.902]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 124:  89%|████████▉ | 228/255 [01:31<00:10,  2.50it/s, loss=0.114, v_num=0, train_loss=0.0704, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.318, val_accuracy=0.902, val_f1_score=0.902]
Epoch 124:  90%|█████████ | 230/255 [01:31<00:09,  2.51it/s, loss=0.114, v_num=0, train_loss=0.0704, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.318, val_accuracy=0.902, val_f1_score=0.902]
Epoch 124:  91%|█████████ | 232/255 [01:31<00:09,  2.53it/s, loss=0.114, v_num=0, train_loss=0.0704, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.318, val_accuracy=0.902, val_f1_score=0.902]
Epoch 124:  92%|█████████▏| 234/255 [01:31<00:08,  2.55it/s, loss=0.114, v_num=0, train_loss=0.0704, train_a

Epoch 124, global step 28249: val_loss was not in top 2


Epoch 125:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.101, v_num=0, train_loss=0.235, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.353, val_accuracy=0.884, val_f1_score=0.884]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 125:  89%|████████▉ | 228/255 [01:25<00:10,  2.65it/s, loss=0.101, v_num=0, train_loss=0.235, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.353, val_accuracy=0.884, val_f1_score=0.884]
Epoch 125:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.101, v_num=0, train_loss=0.235, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.353, val_accuracy=0.884, val_f1_score=0.884]
Epoch 125:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.101, v_num=0, train_loss=0.235, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.353, val_accuracy=0.884, val_f1_score=0.884]
Epoch 125:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.101, v_num=0, train_loss=0.235, train_accu

Epoch 125, global step 28475: val_loss was not in top 2


Epoch 126:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.132, v_num=0, train_loss=0.0976, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.340, val_accuracy=0.898, val_f1_score=0.898]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 126:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.132, v_num=0, train_loss=0.0976, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.340, val_accuracy=0.898, val_f1_score=0.898]
Epoch 126:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.132, v_num=0, train_loss=0.0976, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.340, val_accuracy=0.898, val_f1_score=0.898]
Epoch 126:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.132, v_num=0, train_loss=0.0976, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.340, val_accuracy=0.898, val_f1_score=0.898]
Epoch 126:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.132, v_num=0, train_loss=0.0976, train_a

Epoch 126, global step 28701: val_loss was not in top 2


Epoch 127:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.305, v_num=0, train_loss=0.331, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.272, val_accuracy=0.911, val_f1_score=0.911]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 127:  89%|████████▉ | 228/255 [01:26<00:10,  2.64it/s, loss=0.305, v_num=0, train_loss=0.331, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.272, val_accuracy=0.911, val_f1_score=0.911]
Epoch 127:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.305, v_num=0, train_loss=0.331, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.272, val_accuracy=0.911, val_f1_score=0.911]
Epoch 127:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.305, v_num=0, train_loss=0.331, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.272, val_accuracy=0.911, val_f1_score=0.911]
Epoch 127:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.305, v_num=0, train_loss=0.331, train_accu

Epoch 127, global step 28927: val_loss was not in top 2


Epoch 128:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.189, v_num=0, train_loss=0.253, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.356, val_accuracy=0.857, val_f1_score=0.857] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 128:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.189, v_num=0, train_loss=0.253, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.356, val_accuracy=0.857, val_f1_score=0.857]
Epoch 128:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.189, v_num=0, train_loss=0.253, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.356, val_accuracy=0.857, val_f1_score=0.857]
Epoch 128:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.189, v_num=0, train_loss=0.253, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.356, val_accuracy=0.857, val_f1_score=0.857]
Epoch 128:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.189, v_num=0, train_loss=0.253, train_accur

Epoch 128, global step 29153: val_loss was not in top 2


Epoch 129:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0914, v_num=0, train_loss=0.0138, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.273, val_accuracy=0.899, val_f1_score=0.899]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 129:  89%|████████▉ | 228/255 [01:25<00:10,  2.65it/s, loss=0.0914, v_num=0, train_loss=0.0138, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.273, val_accuracy=0.899, val_f1_score=0.899]
Epoch 129:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0914, v_num=0, train_loss=0.0138, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.273, val_accuracy=0.899, val_f1_score=0.899]
Epoch 129:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0914, v_num=0, train_loss=0.0138, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.273, val_accuracy=0.899, val_f1_score=0.899]
Epoch 129:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.0914, v_num=0, train_loss=0.0138, tr

Epoch 129, global step 29379: val_loss was not in top 2


Epoch 130:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.105, v_num=0, train_loss=0.0363, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.271, val_accuracy=0.906, val_f1_score=0.906] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 130:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.105, v_num=0, train_loss=0.0363, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.271, val_accuracy=0.906, val_f1_score=0.906]
Epoch 130:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.105, v_num=0, train_loss=0.0363, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.271, val_accuracy=0.906, val_f1_score=0.906]
Epoch 130:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.105, v_num=0, train_loss=0.0363, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.271, val_accuracy=0.906, val_f1_score=0.906]
Epoch 130:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.105, v_num=0, train_loss=0.0363, train_

Epoch 130, global step 29605: val_loss was not in top 2


Epoch 131:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.121, v_num=0, train_loss=0.153, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.280, val_accuracy=0.904, val_f1_score=0.904] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 131:  89%|████████▉ | 228/255 [01:26<00:10,  2.64it/s, loss=0.121, v_num=0, train_loss=0.153, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.280, val_accuracy=0.904, val_f1_score=0.904]
Epoch 131:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.121, v_num=0, train_loss=0.153, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.280, val_accuracy=0.904, val_f1_score=0.904]
Epoch 131:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.121, v_num=0, train_loss=0.153, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.280, val_accuracy=0.904, val_f1_score=0.904]
Epoch 131:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.121, v_num=0, train_loss=0.153, train_accur

Epoch 131, global step 29831: val_loss was not in top 2


Epoch 132:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.11, v_num=0, train_loss=0.361, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.273, val_accuracy=0.896, val_f1_score=0.896]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 132:  89%|████████▉ | 228/255 [01:26<00:10,  2.64it/s, loss=0.11, v_num=0, train_loss=0.361, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.273, val_accuracy=0.896, val_f1_score=0.896]
Epoch 132:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.11, v_num=0, train_loss=0.361, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.273, val_accuracy=0.896, val_f1_score=0.896]
Epoch 132:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.11, v_num=0, train_loss=0.361, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.273, val_accuracy=0.896, val_f1_score=0.896]
Epoch 132:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.11, v_num=0, train_loss=0.361, train_accuracy

Epoch 132, global step 30057: val_loss reached 0.24828 (best 0.24675), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2-v1.ckpt" as top 2


Epoch 133:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0995, v_num=0, train_loss=0.0976, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.248, val_accuracy=0.908, val_f1_score=0.908]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 133:  89%|████████▉ | 228/255 [01:26<00:10,  2.64it/s, loss=0.0995, v_num=0, train_loss=0.0976, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.248, val_accuracy=0.908, val_f1_score=0.908]
Epoch 133:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.0995, v_num=0, train_loss=0.0976, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.248, val_accuracy=0.908, val_f1_score=0.908]
Epoch 133:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.0995, v_num=0, train_loss=0.0976, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.248, val_accuracy=0.908, val_f1_score=0.908]
Epoch 133:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.0995, v_num=0, train_loss=0.0976, tr

Epoch 133, global step 30283: val_loss was not in top 2


Epoch 134:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.22, v_num=0, train_loss=0.166, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.344, val_accuracy=0.905, val_f1_score=0.905]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 134:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.22, v_num=0, train_loss=0.166, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.344, val_accuracy=0.905, val_f1_score=0.905]
Epoch 134:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.22, v_num=0, train_loss=0.166, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.344, val_accuracy=0.905, val_f1_score=0.905]
Epoch 134:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.22, v_num=0, train_loss=0.166, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.344, val_accuracy=0.905, val_f1_score=0.905]
Epoch 134:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.22, v_num=0, train_loss=0.166, train_accuracy

Epoch 134, global step 30509: val_loss was not in top 2


Epoch 135:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.125, v_num=0, train_loss=0.264, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.297, val_accuracy=0.896, val_f1_score=0.896] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 135:  89%|████████▉ | 228/255 [01:25<00:10,  2.66it/s, loss=0.125, v_num=0, train_loss=0.264, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.297, val_accuracy=0.896, val_f1_score=0.896]
Epoch 135:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.125, v_num=0, train_loss=0.264, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.297, val_accuracy=0.896, val_f1_score=0.896]
Epoch 135:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.125, v_num=0, train_loss=0.264, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.297, val_accuracy=0.896, val_f1_score=0.896]
Epoch 135:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.125, v_num=0, train_loss=0.264, train_accur

Epoch 135, global step 30735: val_loss was not in top 2


Epoch 136:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.126, v_num=0, train_loss=0.102, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.277, val_accuracy=0.908, val_f1_score=0.908]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 136:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.126, v_num=0, train_loss=0.102, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.277, val_accuracy=0.908, val_f1_score=0.908]
Epoch 136:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.126, v_num=0, train_loss=0.102, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.277, val_accuracy=0.908, val_f1_score=0.908]
Epoch 136:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.126, v_num=0, train_loss=0.102, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.277, val_accuracy=0.908, val_f1_score=0.908]
Epoch 136:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.126, v_num=0, train_loss=0.102, train_accu

Epoch 136, global step 30961: val_loss was not in top 2


Epoch 137:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0977, v_num=0, train_loss=0.0215, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.265, val_accuracy=0.905, val_f1_score=0.905]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 137:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.0977, v_num=0, train_loss=0.0215, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.265, val_accuracy=0.905, val_f1_score=0.905]
Epoch 137:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.0977, v_num=0, train_loss=0.0215, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.265, val_accuracy=0.905, val_f1_score=0.905]
Epoch 137:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.0977, v_num=0, train_loss=0.0215, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.265, val_accuracy=0.905, val_f1_score=0.905]
Epoch 137:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.0977, v_num=0, train_loss=0.0215, tr

Epoch 137, global step 31187: val_loss was not in top 2


Epoch 138:  89%|████████▊ | 226/255 [01:19<00:10,  2.84it/s, loss=0.111, v_num=0, train_loss=0.0161, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.322, val_accuracy=0.896, val_f1_score=0.896]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 138:  89%|████████▉ | 228/255 [01:25<00:10,  2.66it/s, loss=0.111, v_num=0, train_loss=0.0161, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.322, val_accuracy=0.896, val_f1_score=0.896]
Epoch 138:  90%|█████████ | 230/255 [01:25<00:09,  2.68it/s, loss=0.111, v_num=0, train_loss=0.0161, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.322, val_accuracy=0.896, val_f1_score=0.896]
Epoch 138:  91%|█████████ | 232/255 [01:26<00:08,  2.70it/s, loss=0.111, v_num=0, train_loss=0.0161, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.322, val_accuracy=0.896, val_f1_score=0.896]
Epoch 138:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.111, v_num=0, train_loss=0.0161, train

Epoch 138, global step 31413: val_loss was not in top 2


Epoch 139:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.164, v_num=0, train_loss=0.501, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.413, val_accuracy=0.883, val_f1_score=0.883] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 139:  89%|████████▉ | 228/255 [01:25<00:10,  2.65it/s, loss=0.164, v_num=0, train_loss=0.501, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.413, val_accuracy=0.883, val_f1_score=0.883]
Epoch 139:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.164, v_num=0, train_loss=0.501, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.413, val_accuracy=0.883, val_f1_score=0.883]
Epoch 139:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.164, v_num=0, train_loss=0.501, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.413, val_accuracy=0.883, val_f1_score=0.883]
Epoch 139:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.164, v_num=0, train_loss=0.501, train_accur

Epoch 139, global step 31639: val_loss was not in top 2


Epoch 140:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.114, v_num=0, train_loss=0.299, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.317, val_accuracy=0.889, val_f1_score=0.889]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 140:  89%|████████▉ | 228/255 [01:25<00:10,  2.65it/s, loss=0.114, v_num=0, train_loss=0.299, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.317, val_accuracy=0.889, val_f1_score=0.889]
Epoch 140:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.114, v_num=0, train_loss=0.299, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.317, val_accuracy=0.889, val_f1_score=0.889]
Epoch 140:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.114, v_num=0, train_loss=0.299, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.317, val_accuracy=0.889, val_f1_score=0.889]
Epoch 140:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.114, v_num=0, train_loss=0.299, train_accu

Epoch 140, global step 31865: val_loss was not in top 2


Epoch 141:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0878, v_num=0, train_loss=0.00269, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.304, val_accuracy=0.904, val_f1_score=0.904]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 141:  89%|████████▉ | 228/255 [01:25<00:10,  2.66it/s, loss=0.0878, v_num=0, train_loss=0.00269, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.304, val_accuracy=0.904, val_f1_score=0.904]
Epoch 141:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0878, v_num=0, train_loss=0.00269, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.304, val_accuracy=0.904, val_f1_score=0.904]
Epoch 141:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0878, v_num=0, train_loss=0.00269, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.304, val_accuracy=0.904, val_f1_score=0.904]
Epoch 141:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.0878, v_num=0, train_loss=0.0026

Epoch 141, global step 32091: val_loss was not in top 2


Epoch 142:  89%|████████▊ | 226/255 [01:19<00:10,  2.84it/s, loss=0.0827, v_num=0, train_loss=0.130, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.318, val_accuracy=0.907, val_f1_score=0.907]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 142:  89%|████████▉ | 228/255 [01:25<00:10,  2.66it/s, loss=0.0827, v_num=0, train_loss=0.130, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.318, val_accuracy=0.907, val_f1_score=0.907]
Epoch 142:  90%|█████████ | 230/255 [01:25<00:09,  2.68it/s, loss=0.0827, v_num=0, train_loss=0.130, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.318, val_accuracy=0.907, val_f1_score=0.907]
Epoch 142:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0827, v_num=0, train_loss=0.130, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.318, val_accuracy=0.907, val_f1_score=0.907]
Epoch 142:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.0827, v_num=0, train_loss=0.130, train

Epoch 142, global step 32317: val_loss was not in top 2


Epoch 143:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0789, v_num=0, train_loss=0.0437, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.354, val_accuracy=0.894, val_f1_score=0.894] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 143:  89%|████████▉ | 228/255 [01:25<00:10,  2.66it/s, loss=0.0789, v_num=0, train_loss=0.0437, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.354, val_accuracy=0.894, val_f1_score=0.894]
Epoch 143:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0789, v_num=0, train_loss=0.0437, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.354, val_accuracy=0.894, val_f1_score=0.894]
Epoch 143:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0789, v_num=0, train_loss=0.0437, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.354, val_accuracy=0.894, val_f1_score=0.894]
Epoch 143:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.0789, v_num=0, train_loss=0.0437, t

Epoch 143, global step 32543: val_loss was not in top 2


Epoch 144:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0938, v_num=0, train_loss=0.177, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.299, val_accuracy=0.907, val_f1_score=0.907] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 144:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.0938, v_num=0, train_loss=0.177, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.299, val_accuracy=0.907, val_f1_score=0.907]
Epoch 144:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0938, v_num=0, train_loss=0.177, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.299, val_accuracy=0.907, val_f1_score=0.907]
Epoch 144:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0938, v_num=0, train_loss=0.177, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.299, val_accuracy=0.907, val_f1_score=0.907]
Epoch 144:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.0938, v_num=0, train_loss=0.177, train_

Epoch 144, global step 32769: val_loss was not in top 2


Epoch 145:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0635, v_num=0, train_loss=0.123, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.325, val_accuracy=0.911, val_f1_score=0.911] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 145:  89%|████████▉ | 228/255 [01:25<00:10,  2.65it/s, loss=0.0635, v_num=0, train_loss=0.123, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.325, val_accuracy=0.911, val_f1_score=0.911]
Epoch 145:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0635, v_num=0, train_loss=0.123, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.325, val_accuracy=0.911, val_f1_score=0.911]
Epoch 145:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0635, v_num=0, train_loss=0.123, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.325, val_accuracy=0.911, val_f1_score=0.911]
Epoch 145:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.0635, v_num=0, train_loss=0.123, train_

Epoch 145, global step 32995: val_loss was not in top 2


Epoch 146:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.131, v_num=0, train_loss=0.129, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.301, val_accuracy=0.912, val_f1_score=0.912]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 146:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.131, v_num=0, train_loss=0.129, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.301, val_accuracy=0.912, val_f1_score=0.912]
Epoch 146:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.131, v_num=0, train_loss=0.129, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.301, val_accuracy=0.912, val_f1_score=0.912]
Epoch 146:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.131, v_num=0, train_loss=0.129, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.301, val_accuracy=0.912, val_f1_score=0.912]
Epoch 146:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.131, v_num=0, train_loss=0.129, train_acc

Epoch 146, global step 33221: val_loss was not in top 2


Epoch 147:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.185, v_num=0, train_loss=0.387, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.441, val_accuracy=0.881, val_f1_score=0.881]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 147:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.185, v_num=0, train_loss=0.387, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.441, val_accuracy=0.881, val_f1_score=0.881]
Epoch 147:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.185, v_num=0, train_loss=0.387, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.441, val_accuracy=0.881, val_f1_score=0.881]
Epoch 147:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.185, v_num=0, train_loss=0.387, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.441, val_accuracy=0.881, val_f1_score=0.881]
Epoch 147:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.185, v_num=0, train_loss=0.387, train_accu

Epoch 147, global step 33447: val_loss was not in top 2


Epoch 148:  89%|████████▊ | 226/255 [01:19<00:10,  2.84it/s, loss=0.115, v_num=0, train_loss=0.184, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.426, val_accuracy=0.878, val_f1_score=0.878]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 148:  89%|████████▉ | 228/255 [01:25<00:10,  2.66it/s, loss=0.115, v_num=0, train_loss=0.184, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.426, val_accuracy=0.878, val_f1_score=0.878]
Epoch 148:  90%|█████████ | 230/255 [01:25<00:09,  2.68it/s, loss=0.115, v_num=0, train_loss=0.184, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.426, val_accuracy=0.878, val_f1_score=0.878]
Epoch 148:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.115, v_num=0, train_loss=0.184, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.426, val_accuracy=0.878, val_f1_score=0.878]
Epoch 148:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.115, v_num=0, train_loss=0.184, train_accu

Epoch 148, global step 33673: val_loss was not in top 2


Epoch 149:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.131, v_num=0, train_loss=0.243, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.297, val_accuracy=0.905, val_f1_score=0.905]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 149:  89%|████████▉ | 228/255 [01:25<00:10,  2.65it/s, loss=0.131, v_num=0, train_loss=0.243, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.297, val_accuracy=0.905, val_f1_score=0.905]
Epoch 149:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.131, v_num=0, train_loss=0.243, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.297, val_accuracy=0.905, val_f1_score=0.905]
Epoch 149:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.131, v_num=0, train_loss=0.243, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.297, val_accuracy=0.905, val_f1_score=0.905]
Epoch 149:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.131, v_num=0, train_loss=0.243, train_accu

Epoch 149, global step 33899: val_loss was not in top 2


Epoch 150:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0662, v_num=0, train_loss=0.0125, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.277, val_accuracy=0.911, val_f1_score=0.911]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 150:  89%|████████▉ | 228/255 [01:25<00:10,  2.65it/s, loss=0.0662, v_num=0, train_loss=0.0125, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.277, val_accuracy=0.911, val_f1_score=0.911]
Epoch 150:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0662, v_num=0, train_loss=0.0125, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.277, val_accuracy=0.911, val_f1_score=0.911]
Epoch 150:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0662, v_num=0, train_loss=0.0125, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.277, val_accuracy=0.911, val_f1_score=0.911]
Epoch 150:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.0662, v_num=0, train_loss=0.0125, tr

Epoch 150, global step 34125: val_loss was not in top 2


Epoch 151:  89%|████████▊ | 226/255 [01:19<00:10,  2.84it/s, loss=0.062, v_num=0, train_loss=0.0918, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.254, val_accuracy=0.913, val_f1_score=0.913]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 151:  89%|████████▉ | 228/255 [01:25<00:10,  2.66it/s, loss=0.062, v_num=0, train_loss=0.0918, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.254, val_accuracy=0.913, val_f1_score=0.913]
Epoch 151:  90%|█████████ | 230/255 [01:25<00:09,  2.68it/s, loss=0.062, v_num=0, train_loss=0.0918, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.254, val_accuracy=0.913, val_f1_score=0.913]
Epoch 151:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.062, v_num=0, train_loss=0.0918, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.254, val_accuracy=0.913, val_f1_score=0.913]
Epoch 151:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.062, v_num=0, train_loss=0.0918, train

Epoch 151, global step 34351: val_loss was not in top 2


Epoch 152:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0788, v_num=0, train_loss=0.0883, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.272, val_accuracy=0.921, val_f1_score=0.921] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 152:  89%|████████▉ | 228/255 [01:25<00:10,  2.65it/s, loss=0.0788, v_num=0, train_loss=0.0883, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.272, val_accuracy=0.921, val_f1_score=0.921]
Epoch 152:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0788, v_num=0, train_loss=0.0883, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.272, val_accuracy=0.921, val_f1_score=0.921]
Epoch 152:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0788, v_num=0, train_loss=0.0883, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.272, val_accuracy=0.921, val_f1_score=0.921]
Epoch 152:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.0788, v_num=0, train_loss=0.0883, t

Epoch 152, global step 34577: val_loss was not in top 2


Epoch 153:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0768, v_num=0, train_loss=0.00641, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.292, val_accuracy=0.908, val_f1_score=0.908]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 153:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.0768, v_num=0, train_loss=0.00641, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.292, val_accuracy=0.908, val_f1_score=0.908]
Epoch 153:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0768, v_num=0, train_loss=0.00641, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.292, val_accuracy=0.908, val_f1_score=0.908]
Epoch 153:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0768, v_num=0, train_loss=0.00641, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.292, val_accuracy=0.908, val_f1_score=0.908]
Epoch 153:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.0768, v_num=0, train_loss=0.0064

Epoch 153, global step 34803: val_loss was not in top 2


Epoch 154:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.098, v_num=0, train_loss=0.328, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.290, val_accuracy=0.917, val_f1_score=0.917]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 154:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.098, v_num=0, train_loss=0.328, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.290, val_accuracy=0.917, val_f1_score=0.917]
Epoch 154:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.098, v_num=0, train_loss=0.328, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.290, val_accuracy=0.917, val_f1_score=0.917]
Epoch 154:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.098, v_num=0, train_loss=0.328, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.290, val_accuracy=0.917, val_f1_score=0.917]
Epoch 154:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.098, v_num=0, train_loss=0.328, train_acc

Epoch 154, global step 35029: val_loss was not in top 2


Epoch 155:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0476, v_num=0, train_loss=0.0652, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.274, val_accuracy=0.923, val_f1_score=0.923] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 155:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.0476, v_num=0, train_loss=0.0652, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.274, val_accuracy=0.923, val_f1_score=0.923]
Epoch 155:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.0476, v_num=0, train_loss=0.0652, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.274, val_accuracy=0.923, val_f1_score=0.923]
Epoch 155:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.0476, v_num=0, train_loss=0.0652, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.274, val_accuracy=0.923, val_f1_score=0.923]
Epoch 155:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.0476, v_num=0, train_loss=0.0652, t

Epoch 155, global step 35255: val_loss was not in top 2


Epoch 156:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.145, v_num=0, train_loss=0.155, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.338, val_accuracy=0.912, val_f1_score=0.912]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 156:  89%|████████▉ | 228/255 [01:25<00:10,  2.65it/s, loss=0.145, v_num=0, train_loss=0.155, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.338, val_accuracy=0.912, val_f1_score=0.912]
Epoch 156:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.145, v_num=0, train_loss=0.155, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.338, val_accuracy=0.912, val_f1_score=0.912]
Epoch 156:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.145, v_num=0, train_loss=0.155, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.338, val_accuracy=0.912, val_f1_score=0.912]
Epoch 156:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.145, v_num=0, train_loss=0.155, train_acc

Epoch 156, global step 35481: val_loss was not in top 2


Epoch 157:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0759, v_num=0, train_loss=0.235, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.287, val_accuracy=0.889, val_f1_score=0.889] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 157:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.0759, v_num=0, train_loss=0.235, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.287, val_accuracy=0.889, val_f1_score=0.889]
Epoch 157:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.0759, v_num=0, train_loss=0.235, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.287, val_accuracy=0.889, val_f1_score=0.889]
Epoch 157:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.0759, v_num=0, train_loss=0.235, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.287, val_accuracy=0.889, val_f1_score=0.889]
Epoch 157:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.0759, v_num=0, train_loss=0.235, train_

Epoch 157, global step 35707: val_loss was not in top 2


Epoch 158:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0556, v_num=0, train_loss=0.0214, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.258, val_accuracy=0.923, val_f1_score=0.923] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 158:  89%|████████▉ | 228/255 [01:25<00:10,  2.65it/s, loss=0.0556, v_num=0, train_loss=0.0214, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.258, val_accuracy=0.923, val_f1_score=0.923]
Epoch 158:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0556, v_num=0, train_loss=0.0214, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.258, val_accuracy=0.923, val_f1_score=0.923]
Epoch 158:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0556, v_num=0, train_loss=0.0214, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.258, val_accuracy=0.923, val_f1_score=0.923]
Epoch 158:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.0556, v_num=0, train_loss=0.0214, t

Epoch 158, global step 35933: val_loss was not in top 2


Epoch 159:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0964, v_num=0, train_loss=0.187, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.263, val_accuracy=0.925, val_f1_score=0.925] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 159:  89%|████████▉ | 228/255 [01:25<00:10,  2.65it/s, loss=0.0964, v_num=0, train_loss=0.187, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.263, val_accuracy=0.925, val_f1_score=0.925]
Epoch 159:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0964, v_num=0, train_loss=0.187, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.263, val_accuracy=0.925, val_f1_score=0.925]
Epoch 159:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0964, v_num=0, train_loss=0.187, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.263, val_accuracy=0.925, val_f1_score=0.925]
Epoch 159:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.0964, v_num=0, train_loss=0.187, train_

Epoch 159, global step 36159: val_loss was not in top 2


Epoch 160:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.116, v_num=0, train_loss=0.0623, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.252, val_accuracy=0.921, val_f1_score=0.921] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 160:  89%|████████▉ | 228/255 [01:25<00:10,  2.65it/s, loss=0.116, v_num=0, train_loss=0.0623, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.252, val_accuracy=0.921, val_f1_score=0.921]
Epoch 160:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.116, v_num=0, train_loss=0.0623, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.252, val_accuracy=0.921, val_f1_score=0.921]
Epoch 160:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.116, v_num=0, train_loss=0.0623, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.252, val_accuracy=0.921, val_f1_score=0.921]
Epoch 160:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.116, v_num=0, train_loss=0.0623, train_

Epoch 160, global step 36385: val_loss was not in top 2


Epoch 161:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0722, v_num=0, train_loss=0.00177, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.317, val_accuracy=0.905, val_f1_score=0.905]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 161:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.0722, v_num=0, train_loss=0.00177, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.317, val_accuracy=0.905, val_f1_score=0.905]
Epoch 161:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0722, v_num=0, train_loss=0.00177, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.317, val_accuracy=0.905, val_f1_score=0.905]
Epoch 161:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0722, v_num=0, train_loss=0.00177, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.317, val_accuracy=0.905, val_f1_score=0.905]
Epoch 161:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.0722, v_num=0, train_loss=0.0017

Epoch 161, global step 36611: val_loss was not in top 2


Epoch 162:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0791, v_num=0, train_loss=0.0254, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.322, val_accuracy=0.913, val_f1_score=0.913] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 162:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.0791, v_num=0, train_loss=0.0254, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.322, val_accuracy=0.913, val_f1_score=0.913]
Epoch 162:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0791, v_num=0, train_loss=0.0254, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.322, val_accuracy=0.913, val_f1_score=0.913]
Epoch 162:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.0791, v_num=0, train_loss=0.0254, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.322, val_accuracy=0.913, val_f1_score=0.913]
Epoch 162:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.0791, v_num=0, train_loss=0.0254, t

Epoch 162, global step 36837: val_loss reached 0.23335 (best 0.23335), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2-v1.ckpt" as top 2


Epoch 163:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0492, v_num=0, train_loss=0.000522, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.233, val_accuracy=0.931, val_f1_score=0.931]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 163:  89%|████████▉ | 228/255 [01:26<00:10,  2.64it/s, loss=0.0492, v_num=0, train_loss=0.000522, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.233, val_accuracy=0.931, val_f1_score=0.931]
Epoch 163:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.0492, v_num=0, train_loss=0.000522, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.233, val_accuracy=0.931, val_f1_score=0.931]
Epoch 163:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.0492, v_num=0, train_loss=0.000522, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.233, val_accuracy=0.931, val_f1_score=0.931]
Epoch 163:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.0492, v_num=0, train_loss=0.

Epoch 163, global step 37063: val_loss reached 0.22967 (best 0.22967), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2.ckpt" as top 2


Epoch 164:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0395, v_num=0, train_loss=0.0852, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.230, val_accuracy=0.924, val_f1_score=0.924]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 164:  89%|████████▉ | 228/255 [01:25<00:10,  2.65it/s, loss=0.0395, v_num=0, train_loss=0.0852, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.230, val_accuracy=0.924, val_f1_score=0.924]
Epoch 164:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0395, v_num=0, train_loss=0.0852, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.230, val_accuracy=0.924, val_f1_score=0.924]
Epoch 164:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0395, v_num=0, train_loss=0.0852, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.230, val_accuracy=0.924, val_f1_score=0.924]
Epoch 164:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.0395, v_num=0, train_loss=0.0852, 

Epoch 164, global step 37289: val_loss was not in top 2


Epoch 165:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0609, v_num=0, train_loss=0.00506, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.245, val_accuracy=0.930, val_f1_score=0.930]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 165:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.0609, v_num=0, train_loss=0.00506, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.245, val_accuracy=0.930, val_f1_score=0.930]
Epoch 165:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.0609, v_num=0, train_loss=0.00506, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.245, val_accuracy=0.930, val_f1_score=0.930]
Epoch 165:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.0609, v_num=0, train_loss=0.00506, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.245, val_accuracy=0.930, val_f1_score=0.930]
Epoch 165:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.0609, v_num=0, train_loss=0.0050

Epoch 165, global step 37515: val_loss was not in top 2


Epoch 166:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0437, v_num=0, train_loss=0.00674, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.242, val_accuracy=0.924, val_f1_score=0.924]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 166:  89%|████████▉ | 228/255 [01:25<00:10,  2.66it/s, loss=0.0437, v_num=0, train_loss=0.00674, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.242, val_accuracy=0.924, val_f1_score=0.924]
Epoch 166:  90%|█████████ | 230/255 [01:25<00:09,  2.68it/s, loss=0.0437, v_num=0, train_loss=0.00674, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.242, val_accuracy=0.924, val_f1_score=0.924]
Epoch 166:  91%|█████████ | 232/255 [01:26<00:08,  2.70it/s, loss=0.0437, v_num=0, train_loss=0.00674, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.242, val_accuracy=0.924, val_f1_score=0.924]
Epoch 166:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.0437, v_num=0, train_loss=0.0067

Epoch 166, global step 37741: val_loss reached 0.21648 (best 0.21648), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2-v1.ckpt" as top 2


Epoch 167:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0475, v_num=0, train_loss=0.0471, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.216, val_accuracy=0.928, val_f1_score=0.928] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 167:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.0475, v_num=0, train_loss=0.0471, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.216, val_accuracy=0.928, val_f1_score=0.928]
Epoch 167:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0475, v_num=0, train_loss=0.0471, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.216, val_accuracy=0.928, val_f1_score=0.928]
Epoch 167:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0475, v_num=0, train_loss=0.0471, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.216, val_accuracy=0.928, val_f1_score=0.928]
Epoch 167:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.0475, v_num=0, train_loss=0.0471, t

Epoch 167, global step 37967: val_loss was not in top 2


Epoch 168:  89%|████████▊ | 226/255 [01:19<00:10,  2.84it/s, loss=0.0801, v_num=0, train_loss=0.00795, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.243, val_accuracy=0.925, val_f1_score=0.925]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 168:  89%|████████▉ | 228/255 [01:25<00:10,  2.66it/s, loss=0.0801, v_num=0, train_loss=0.00795, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.243, val_accuracy=0.925, val_f1_score=0.925]
Epoch 168:  90%|█████████ | 230/255 [01:25<00:09,  2.68it/s, loss=0.0801, v_num=0, train_loss=0.00795, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.243, val_accuracy=0.925, val_f1_score=0.925]
Epoch 168:  91%|█████████ | 232/255 [01:26<00:08,  2.70it/s, loss=0.0801, v_num=0, train_loss=0.00795, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.243, val_accuracy=0.925, val_f1_score=0.925]
Epoch 168:  92%|█████████▏| 234/255 [01:26<00:07,  2.72it/s, loss=0.0801, v_num=0, train_loss=0.0079

Epoch 168, global step 38193: val_loss was not in top 2


Epoch 169:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0715, v_num=0, train_loss=0.205, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.253, val_accuracy=0.918, val_f1_score=0.918]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 169:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.0715, v_num=0, train_loss=0.205, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.253, val_accuracy=0.918, val_f1_score=0.918]
Epoch 169:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0715, v_num=0, train_loss=0.205, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.253, val_accuracy=0.918, val_f1_score=0.918]
Epoch 169:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0715, v_num=0, train_loss=0.205, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.253, val_accuracy=0.918, val_f1_score=0.918]
Epoch 169:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.0715, v_num=0, train_loss=0.205, train

Epoch 169, global step 38419: val_loss was not in top 2


Epoch 170:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0766, v_num=0, train_loss=0.0434, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.247, val_accuracy=0.930, val_f1_score=0.930] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 170:  89%|████████▉ | 228/255 [01:25<00:10,  2.65it/s, loss=0.0766, v_num=0, train_loss=0.0434, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.247, val_accuracy=0.930, val_f1_score=0.930]
Epoch 170:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0766, v_num=0, train_loss=0.0434, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.247, val_accuracy=0.930, val_f1_score=0.930]
Epoch 170:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0766, v_num=0, train_loss=0.0434, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.247, val_accuracy=0.930, val_f1_score=0.930]
Epoch 170:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.0766, v_num=0, train_loss=0.0434, t

Epoch 170, global step 38645: val_loss was not in top 2


Epoch 171:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0322, v_num=0, train_loss=0.00299, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.281, val_accuracy=0.923, val_f1_score=0.923]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 171:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.0322, v_num=0, train_loss=0.00299, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.281, val_accuracy=0.923, val_f1_score=0.923]
Epoch 171:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0322, v_num=0, train_loss=0.00299, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.281, val_accuracy=0.923, val_f1_score=0.923]
Epoch 171:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0322, v_num=0, train_loss=0.00299, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.281, val_accuracy=0.923, val_f1_score=0.923]
Epoch 171:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.0322, v_num=0, train_loss=0.0029

Epoch 171, global step 38871: val_loss reached 0.22223 (best 0.21648), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2.ckpt" as top 2


Epoch 172:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0768, v_num=0, train_loss=0.0101, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.222, val_accuracy=0.932, val_f1_score=0.932] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 172:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.0768, v_num=0, train_loss=0.0101, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.222, val_accuracy=0.932, val_f1_score=0.932]
Epoch 172:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.0768, v_num=0, train_loss=0.0101, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.222, val_accuracy=0.932, val_f1_score=0.932]
Epoch 172:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.0768, v_num=0, train_loss=0.0101, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.222, val_accuracy=0.932, val_f1_score=0.932]
Epoch 172:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.0768, v_num=0, train_loss=0.0101, t

Epoch 172, global step 39097: val_loss was not in top 2


Epoch 173:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0554, v_num=0, train_loss=0.014, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.243, val_accuracy=0.928, val_f1_score=0.928]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 173:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.0554, v_num=0, train_loss=0.014, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.243, val_accuracy=0.928, val_f1_score=0.928]
Epoch 173:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0554, v_num=0, train_loss=0.014, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.243, val_accuracy=0.928, val_f1_score=0.928]
Epoch 173:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.0554, v_num=0, train_loss=0.014, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.243, val_accuracy=0.928, val_f1_score=0.928]
Epoch 173:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.0554, v_num=0, train_loss=0.014, train

Epoch 173, global step 39323: val_loss was not in top 2


Epoch 174:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0347, v_num=0, train_loss=0.0165, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.231, val_accuracy=0.930, val_f1_score=0.930] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 174:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.0347, v_num=0, train_loss=0.0165, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.231, val_accuracy=0.930, val_f1_score=0.930]
Epoch 174:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0347, v_num=0, train_loss=0.0165, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.231, val_accuracy=0.930, val_f1_score=0.930]
Epoch 174:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0347, v_num=0, train_loss=0.0165, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.231, val_accuracy=0.930, val_f1_score=0.930]
Epoch 174:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.0347, v_num=0, train_loss=0.0165, t

Epoch 174, global step 39549: val_loss was not in top 2


Epoch 175:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0535, v_num=0, train_loss=0.000636, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.241, val_accuracy=0.928, val_f1_score=0.928]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 175:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.0535, v_num=0, train_loss=0.000636, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.241, val_accuracy=0.928, val_f1_score=0.928]
Epoch 175:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0535, v_num=0, train_loss=0.000636, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.241, val_accuracy=0.928, val_f1_score=0.928]
Epoch 175:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0535, v_num=0, train_loss=0.000636, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.241, val_accuracy=0.928, val_f1_score=0.928]
Epoch 175:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.0535, v_num=0, train_loss=0.

Epoch 175, global step 39775: val_loss was not in top 2


Epoch 176:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0474, v_num=0, train_loss=0.264, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.258, val_accuracy=0.930, val_f1_score=0.930]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 176:  89%|████████▉ | 228/255 [01:26<00:10,  2.64it/s, loss=0.0474, v_num=0, train_loss=0.264, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.258, val_accuracy=0.930, val_f1_score=0.930]
Epoch 176:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.0474, v_num=0, train_loss=0.264, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.258, val_accuracy=0.930, val_f1_score=0.930]
Epoch 176:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.0474, v_num=0, train_loss=0.264, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.258, val_accuracy=0.930, val_f1_score=0.930]
Epoch 176:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.0474, v_num=0, train_loss=0.264, trai

Epoch 176, global step 40001: val_loss was not in top 2


Epoch 177:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.103, v_num=0, train_loss=0.0139, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.265, val_accuracy=0.931, val_f1_score=0.931]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 177:  89%|████████▉ | 228/255 [01:25<00:10,  2.66it/s, loss=0.103, v_num=0, train_loss=0.0139, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.265, val_accuracy=0.931, val_f1_score=0.931]
Epoch 177:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.103, v_num=0, train_loss=0.0139, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.265, val_accuracy=0.931, val_f1_score=0.931]
Epoch 177:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.103, v_num=0, train_loss=0.0139, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.265, val_accuracy=0.931, val_f1_score=0.931]
Epoch 177:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.103, v_num=0, train_loss=0.0139, train

Epoch 177, global step 40227: val_loss was not in top 2


Epoch 178:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0481, v_num=0, train_loss=0.0194, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.264, val_accuracy=0.913, val_f1_score=0.913] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 178:  89%|████████▉ | 228/255 [01:25<00:10,  2.65it/s, loss=0.0481, v_num=0, train_loss=0.0194, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.264, val_accuracy=0.913, val_f1_score=0.913]
Epoch 178:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0481, v_num=0, train_loss=0.0194, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.264, val_accuracy=0.913, val_f1_score=0.913]
Epoch 178:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0481, v_num=0, train_loss=0.0194, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.264, val_accuracy=0.913, val_f1_score=0.913]
Epoch 178:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.0481, v_num=0, train_loss=0.0194, t

Epoch 178, global step 40453: val_loss was not in top 2


Epoch 179:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.069, v_num=0, train_loss=0.0828, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.227, val_accuracy=0.933, val_f1_score=0.933]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 179:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.069, v_num=0, train_loss=0.0828, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.227, val_accuracy=0.933, val_f1_score=0.933]
Epoch 179:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.069, v_num=0, train_loss=0.0828, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.227, val_accuracy=0.933, val_f1_score=0.933]
Epoch 179:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.069, v_num=0, train_loss=0.0828, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.227, val_accuracy=0.933, val_f1_score=0.933]
Epoch 179:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.069, v_num=0, train_loss=0.0828, train

Epoch 179, global step 40679: val_loss reached 0.21904 (best 0.21648), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-2.ckpt" as top 2


Epoch 180:  89%|████████▊ | 226/255 [01:19<00:10,  2.84it/s, loss=0.0356, v_num=0, train_loss=0.0243, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.219, val_accuracy=0.931, val_f1_score=0.931] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 180:  89%|████████▉ | 228/255 [01:25<00:10,  2.66it/s, loss=0.0356, v_num=0, train_loss=0.0243, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.219, val_accuracy=0.931, val_f1_score=0.931]
Epoch 180:  90%|█████████ | 230/255 [01:25<00:09,  2.68it/s, loss=0.0356, v_num=0, train_loss=0.0243, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.219, val_accuracy=0.931, val_f1_score=0.931]
Epoch 180:  91%|█████████ | 232/255 [01:26<00:08,  2.70it/s, loss=0.0356, v_num=0, train_loss=0.0243, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.219, val_accuracy=0.931, val_f1_score=0.931]
Epoch 180:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.0356, v_num=0, train_loss=0.0243, t

Epoch 180, global step 40905: val_loss was not in top 2


Epoch 181:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0344, v_num=0, train_loss=0.0506, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.255, val_accuracy=0.930, val_f1_score=0.930] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 181:  89%|████████▉ | 228/255 [01:26<00:10,  2.64it/s, loss=0.0344, v_num=0, train_loss=0.0506, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.255, val_accuracy=0.930, val_f1_score=0.930]
Epoch 181:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.0344, v_num=0, train_loss=0.0506, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.255, val_accuracy=0.930, val_f1_score=0.930]
Epoch 181:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.0344, v_num=0, train_loss=0.0506, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.255, val_accuracy=0.930, val_f1_score=0.930]
Epoch 181:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.0344, v_num=0, train_loss=0.0506, t

Epoch 181, global step 41131: val_loss was not in top 2


Epoch 182:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0246, v_num=0, train_loss=0.0192, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.263, val_accuracy=0.925, val_f1_score=0.925] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 182:  89%|████████▉ | 228/255 [01:25<00:10,  2.65it/s, loss=0.0246, v_num=0, train_loss=0.0192, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.263, val_accuracy=0.925, val_f1_score=0.925]
Epoch 182:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0246, v_num=0, train_loss=0.0192, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.263, val_accuracy=0.925, val_f1_score=0.925]
Epoch 182:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0246, v_num=0, train_loss=0.0192, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.263, val_accuracy=0.925, val_f1_score=0.925]
Epoch 182:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.0246, v_num=0, train_loss=0.0192, t

Epoch 182, global step 41357: val_loss was not in top 2


Epoch 183:  89%|████████▊ | 226/255 [01:19<00:10,  2.84it/s, loss=0.0189, v_num=0, train_loss=0.00654, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.282, val_accuracy=0.931, val_f1_score=0.931]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 183:  89%|████████▉ | 228/255 [01:25<00:10,  2.66it/s, loss=0.0189, v_num=0, train_loss=0.00654, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.282, val_accuracy=0.931, val_f1_score=0.931]
Epoch 183:  90%|█████████ | 230/255 [01:25<00:09,  2.68it/s, loss=0.0189, v_num=0, train_loss=0.00654, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.282, val_accuracy=0.931, val_f1_score=0.931]
Epoch 183:  91%|█████████ | 232/255 [01:26<00:08,  2.70it/s, loss=0.0189, v_num=0, train_loss=0.00654, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.282, val_accuracy=0.931, val_f1_score=0.931]
Epoch 183:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.0189, v_num=0, train_loss=0.0065

Epoch 183, global step 41583: val_loss was not in top 2


Epoch 184:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0484, v_num=0, train_loss=0.00974, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.286, val_accuracy=0.924, val_f1_score=0.924]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 184:  89%|████████▉ | 228/255 [01:25<00:10,  2.65it/s, loss=0.0484, v_num=0, train_loss=0.00974, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.286, val_accuracy=0.924, val_f1_score=0.924]
Epoch 184:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0484, v_num=0, train_loss=0.00974, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.286, val_accuracy=0.924, val_f1_score=0.924]
Epoch 184:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0484, v_num=0, train_loss=0.00974, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.286, val_accuracy=0.924, val_f1_score=0.924]
Epoch 184:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.0484, v_num=0, train_loss=0.0097

Epoch 184, global step 41809: val_loss was not in top 2


Epoch 185:  89%|████████▊ | 226/255 [01:19<00:10,  2.85it/s, loss=0.028, v_num=0, train_loss=0.00907, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.246, val_accuracy=0.928, val_f1_score=0.928] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 185:  89%|████████▉ | 228/255 [01:25<00:10,  2.67it/s, loss=0.028, v_num=0, train_loss=0.00907, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.246, val_accuracy=0.928, val_f1_score=0.928]
Epoch 185:  90%|█████████ | 230/255 [01:25<00:09,  2.69it/s, loss=0.028, v_num=0, train_loss=0.00907, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.246, val_accuracy=0.928, val_f1_score=0.928]
Epoch 185:  91%|█████████ | 232/255 [01:25<00:08,  2.70it/s, loss=0.028, v_num=0, train_loss=0.00907, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.246, val_accuracy=0.928, val_f1_score=0.928]
Epoch 185:  92%|█████████▏| 234/255 [01:25<00:07,  2.72it/s, loss=0.028, v_num=0, train_loss=0.00907, t

Epoch 185, global step 42035: val_loss was not in top 2


Epoch 186:  89%|████████▊ | 226/255 [01:19<00:10,  2.84it/s, loss=0.0666, v_num=0, train_loss=0.00865, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.264, val_accuracy=0.930, val_f1_score=0.930]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 186:  89%|████████▉ | 228/255 [01:25<00:10,  2.66it/s, loss=0.0666, v_num=0, train_loss=0.00865, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.264, val_accuracy=0.930, val_f1_score=0.930]
Epoch 186:  90%|█████████ | 230/255 [01:25<00:09,  2.68it/s, loss=0.0666, v_num=0, train_loss=0.00865, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.264, val_accuracy=0.930, val_f1_score=0.930]
Epoch 186:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0666, v_num=0, train_loss=0.00865, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.264, val_accuracy=0.930, val_f1_score=0.930]
Epoch 186:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.0666, v_num=0, train_loss=0.0086

Epoch 186, global step 42261: val_loss was not in top 2


Epoch 187:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0324, v_num=0, train_loss=0.0329, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.256, val_accuracy=0.934, val_f1_score=0.934] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 187:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.0324, v_num=0, train_loss=0.0329, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.256, val_accuracy=0.934, val_f1_score=0.934]
Epoch 187:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.0324, v_num=0, train_loss=0.0329, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.256, val_accuracy=0.934, val_f1_score=0.934]
Epoch 187:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.0324, v_num=0, train_loss=0.0329, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.256, val_accuracy=0.934, val_f1_score=0.934]
Epoch 187:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.0324, v_num=0, train_loss=0.0329, t

Epoch 187, global step 42487: val_loss was not in top 2


Epoch 188:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0291, v_num=0, train_loss=0.168, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.235, val_accuracy=0.936, val_f1_score=0.936]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 188:  89%|████████▉ | 228/255 [01:25<00:10,  2.65it/s, loss=0.0291, v_num=0, train_loss=0.168, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.235, val_accuracy=0.936, val_f1_score=0.936]
Epoch 188:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0291, v_num=0, train_loss=0.168, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.235, val_accuracy=0.936, val_f1_score=0.936]
Epoch 188:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0291, v_num=0, train_loss=0.168, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.235, val_accuracy=0.936, val_f1_score=0.936]
Epoch 188:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.0291, v_num=0, train_loss=0.168, train

Epoch 188, global step 42713: val_loss was not in top 2


Epoch 189:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0163, v_num=0, train_loss=0.0178, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.285, val_accuracy=0.923, val_f1_score=0.923]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 189:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.0163, v_num=0, train_loss=0.0178, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.285, val_accuracy=0.923, val_f1_score=0.923]
Epoch 189:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0163, v_num=0, train_loss=0.0178, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.285, val_accuracy=0.923, val_f1_score=0.923]
Epoch 189:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.0163, v_num=0, train_loss=0.0178, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.285, val_accuracy=0.923, val_f1_score=0.923]
Epoch 189:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.0163, v_num=0, train_loss=0.0178, 

Epoch 189, global step 42939: val_loss was not in top 2


Epoch 190:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0398, v_num=0, train_loss=0.0261, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.279, val_accuracy=0.935, val_f1_score=0.935] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 190:  89%|████████▉ | 228/255 [01:26<00:10,  2.64it/s, loss=0.0398, v_num=0, train_loss=0.0261, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.279, val_accuracy=0.935, val_f1_score=0.935]
Epoch 190:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.0398, v_num=0, train_loss=0.0261, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.279, val_accuracy=0.935, val_f1_score=0.935]
Epoch 190:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.0398, v_num=0, train_loss=0.0261, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.279, val_accuracy=0.935, val_f1_score=0.935]
Epoch 190:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.0398, v_num=0, train_loss=0.0261, t

Epoch 190, global step 43165: val_loss was not in top 2


Epoch 191:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0258, v_num=0, train_loss=0.00192, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.242, val_accuracy=0.929, val_f1_score=0.929]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 191:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.0258, v_num=0, train_loss=0.00192, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.242, val_accuracy=0.929, val_f1_score=0.929]
Epoch 191:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.0258, v_num=0, train_loss=0.00192, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.242, val_accuracy=0.929, val_f1_score=0.929]
Epoch 191:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.0258, v_num=0, train_loss=0.00192, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.242, val_accuracy=0.929, val_f1_score=0.929]
Epoch 191:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.0258, v_num=0, train_loss=0.0019

Epoch 191, global step 43391: val_loss was not in top 2


Epoch 192:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0191, v_num=0, train_loss=0.00317, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.255, val_accuracy=0.928, val_f1_score=0.928]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 192:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.0191, v_num=0, train_loss=0.00317, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.255, val_accuracy=0.928, val_f1_score=0.928]
Epoch 192:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.0191, v_num=0, train_loss=0.00317, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.255, val_accuracy=0.928, val_f1_score=0.928]
Epoch 192:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.0191, v_num=0, train_loss=0.00317, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.255, val_accuracy=0.928, val_f1_score=0.928]
Epoch 192:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.0191, v_num=0, train_loss=0.0031

Epoch 192, global step 43617: val_loss was not in top 2


Epoch 193:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0165, v_num=0, train_loss=0.00146, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.248, val_accuracy=0.931, val_f1_score=0.931] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 193:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.0165, v_num=0, train_loss=0.00146, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.248, val_accuracy=0.931, val_f1_score=0.931]
Epoch 193:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.0165, v_num=0, train_loss=0.00146, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.248, val_accuracy=0.931, val_f1_score=0.931]
Epoch 193:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.0165, v_num=0, train_loss=0.00146, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.248, val_accuracy=0.931, val_f1_score=0.931]
Epoch 193:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.0165, v_num=0, train_loss=0.001

Epoch 193, global step 43843: val_loss was not in top 2


Epoch 194:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0575, v_num=0, train_loss=0.00384, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.262, val_accuracy=0.930, val_f1_score=0.930]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 194:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.0575, v_num=0, train_loss=0.00384, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.262, val_accuracy=0.930, val_f1_score=0.930]
Epoch 194:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0575, v_num=0, train_loss=0.00384, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.262, val_accuracy=0.930, val_f1_score=0.930]
Epoch 194:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0575, v_num=0, train_loss=0.00384, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.262, val_accuracy=0.930, val_f1_score=0.930]
Epoch 194:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.0575, v_num=0, train_loss=0.00

Epoch 194, global step 44069: val_loss was not in top 2


Epoch 195:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0194, v_num=0, train_loss=0.0102, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.302, val_accuracy=0.918, val_f1_score=0.918]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 195:  89%|████████▉ | 228/255 [01:25<00:10,  2.65it/s, loss=0.0194, v_num=0, train_loss=0.0102, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.302, val_accuracy=0.918, val_f1_score=0.918]
Epoch 195:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0194, v_num=0, train_loss=0.0102, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.302, val_accuracy=0.918, val_f1_score=0.918]
Epoch 195:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0194, v_num=0, train_loss=0.0102, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.302, val_accuracy=0.918, val_f1_score=0.918]
Epoch 195:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.0194, v_num=0, train_loss=0.0102, 

Epoch 195, global step 44295: val_loss was not in top 2


Epoch 196:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0161, v_num=0, train_loss=0.00223, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.256, val_accuracy=0.934, val_f1_score=0.934] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 196:  89%|████████▉ | 228/255 [01:25<00:10,  2.65it/s, loss=0.0161, v_num=0, train_loss=0.00223, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.256, val_accuracy=0.934, val_f1_score=0.934]
Epoch 196:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0161, v_num=0, train_loss=0.00223, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.256, val_accuracy=0.934, val_f1_score=0.934]
Epoch 196:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0161, v_num=0, train_loss=0.00223, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.256, val_accuracy=0.934, val_f1_score=0.934]
Epoch 196:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.0161, v_num=0, train_loss=0.002

Epoch 196, global step 44521: val_loss was not in top 2


Epoch 197:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0128, v_num=0, train_loss=0.000858, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.235, val_accuracy=0.935, val_f1_score=0.935] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 197:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.0128, v_num=0, train_loss=0.000858, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.235, val_accuracy=0.935, val_f1_score=0.935]
Epoch 197:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0128, v_num=0, train_loss=0.000858, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.235, val_accuracy=0.935, val_f1_score=0.935]
Epoch 197:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0128, v_num=0, train_loss=0.000858, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.235, val_accuracy=0.935, val_f1_score=0.935]
Epoch 197:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.0128, v_num=0, train_loss=0

Epoch 197, global step 44747: val_loss was not in top 2


Epoch 198:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0382, v_num=0, train_loss=0.000931, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.241, val_accuracy=0.945, val_f1_score=0.945]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 198:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.0382, v_num=0, train_loss=0.000931, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.241, val_accuracy=0.945, val_f1_score=0.945]
Epoch 198:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.0382, v_num=0, train_loss=0.000931, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.241, val_accuracy=0.945, val_f1_score=0.945]
Epoch 198:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.0382, v_num=0, train_loss=0.000931, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.241, val_accuracy=0.945, val_f1_score=0.945]
Epoch 198:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.0382, v_num=0, train_loss=0.

Epoch 198, global step 44973: val_loss was not in top 2


Epoch 199:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0484, v_num=0, train_loss=0.00362, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.262, val_accuracy=0.930, val_f1_score=0.930] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 199:  89%|████████▉ | 228/255 [01:25<00:10,  2.65it/s, loss=0.0484, v_num=0, train_loss=0.00362, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.262, val_accuracy=0.930, val_f1_score=0.930]
Epoch 199:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.0484, v_num=0, train_loss=0.00362, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.262, val_accuracy=0.930, val_f1_score=0.930]
Epoch 199:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.0484, v_num=0, train_loss=0.00362, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.262, val_accuracy=0.930, val_f1_score=0.930]
Epoch 199:  92%|█████████▏| 234/255 [01:26<00:07,  2.71it/s, loss=0.0484, v_num=0, train_loss=0.003

Epoch 199, global step 45199: val_loss was not in top 2


Epoch 199: 100%|██████████| 255/255 [01:28<00:00,  2.87it/s, loss=0.0484, v_num=0, train_loss=0.00362, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.233, val_accuracy=0.930, val_f1_score=0.930]


LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1,2]


Testing: 100%|██████████| 29/29 [00:09<00:00,  4.84it/s]--------------------------------------------------------------------------------
DATALOADER:0 TEST RESULTS
{'test_f1_score': 0.929737389087677,
 'test_train_accuracy': 0.929737389087677,
 'test_train_loss': 0.25471553206443787}
--------------------------------------------------------------------------------
Testing: 100%|██████████| 29/29 [00:09<00:00,  3.18it/s]
------------------ Round: 3 ------------------
['FT10', 'O2', 'O1', 'FT7', 'F4', 'TP7', 'C3', 'C4', 'F3', 'FT8', 'T6', 'HEOR', 'T5', 'VEOL', 'F7', 'FZ', 'VEOU', 'A1', 'P3', 'PZ', 'CP3', 'P4', 'CPZ', 'A2', 'HEOL', 'CP4', 'FT9', 'F8', 'OZ', 'CZ', 'FC4', 'FC3', 'FP1', 'PO1', 'T3', 'T4', 'PO2']
Len: 37


GPU available: True, used: True
TPU available: False, using: 0 TPU cores
IPU available: False, using: 0 IPUs
LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1,2]
Missing logger folder: lightning_logs/Drowsy_3

  | Name      | Type             | Params
-----------------------------------------------
0 | model     | DrowsyModel      | 1.4 M 
1 | criterion | CrossEntropyLoss | 0     
-----------------------------------------------
1.4 M     Trainable params
0         Non-trainable params
1.4 M     Total params
5.421     Total estimated model params size (MB)


                                                                      

Global seed set to 42


Epoch 0:  89%|████████▊ | 226/255 [01:19<00:10,  2.84it/s, loss=0.627, v_num=0, train_loss=0.520, train_accuracy=0.667, train_f1_score=0.667]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 0:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.627, v_num=0, train_loss=0.520, train_accuracy=0.667, train_f1_score=0.667]
Epoch 0:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.627, v_num=0, train_loss=0.520, train_accuracy=0.667, train_f1_score=0.667]
Epoch 0:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.627, v_num=0, train_loss=0.520, train_accuracy=0.667, train_f1_score=0.667]
Epoch 0:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.627, v_num=0, train_loss=0.520, train_accuracy=0.667, train_f1_score=0.667]
Epoch 0:  93%|█████████▎| 236/255 [01:26<00:06,  2.72it/s, loss=0.627, v_num=0, train_loss=0.520, train_accuracy=0.667, train_f1_score=0.667]
Epoch 0:  93%|█████████▎| 238/255 [01:26<00:06,  2.74it/s, l

Epoch 0, global step 225: val_loss reached 0.65169 (best 0.65169), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3.ckpt" as top 2


Epoch 1:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.556, v_num=0, train_loss=0.533, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.652, val_accuracy=0.644, val_f1_score=0.644]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 1:  89%|████████▉ | 228/255 [01:26<00:10,  2.64it/s, loss=0.556, v_num=0, train_loss=0.533, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.652, val_accuracy=0.644, val_f1_score=0.644]
Epoch 1:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.556, v_num=0, train_loss=0.533, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.652, val_accuracy=0.644, val_f1_score=0.644]
Epoch 1:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.556, v_num=0, train_loss=0.533, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.652, val_accuracy=0.644, val_f1_score=0.644]
Epoch 1:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.556, v_num=0, train_loss=0.533, train_accuracy=0.667, 

Epoch 1, global step 451: val_loss reached 0.61214 (best 0.61214), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3-v1.ckpt" as top 2


Epoch 2:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.574, v_num=0, train_loss=0.581, train_accuracy=0.611, train_f1_score=0.611, val_loss=0.612, val_accuracy=0.691, val_f1_score=0.691]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 2:  89%|████████▉ | 228/255 [01:26<00:10,  2.64it/s, loss=0.574, v_num=0, train_loss=0.581, train_accuracy=0.611, train_f1_score=0.611, val_loss=0.612, val_accuracy=0.691, val_f1_score=0.691]
Epoch 2:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.574, v_num=0, train_loss=0.581, train_accuracy=0.611, train_f1_score=0.611, val_loss=0.612, val_accuracy=0.691, val_f1_score=0.691]
Epoch 2:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.574, v_num=0, train_loss=0.581, train_accuracy=0.611, train_f1_score=0.611, val_loss=0.612, val_accuracy=0.691, val_f1_score=0.691]
Epoch 2:  92%|█████████▏| 234/255 [01:26<00:07,  2.69it/s, loss=0.574, v_num=0, train_loss=0.581, train_accuracy=0.611, 

Epoch 2, global step 677: val_loss reached 0.59018 (best 0.59018), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3.ckpt" as top 2


Epoch 3:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.51, v_num=0, train_loss=0.408, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.590, val_accuracy=0.704, val_f1_score=0.704] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 3:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.51, v_num=0, train_loss=0.408, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.590, val_accuracy=0.704, val_f1_score=0.704]
Epoch 3:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.51, v_num=0, train_loss=0.408, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.590, val_accuracy=0.704, val_f1_score=0.704]
Epoch 3:  91%|█████████ | 232/255 [01:26<00:08,  2.67it/s, loss=0.51, v_num=0, train_loss=0.408, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.590, val_accuracy=0.704, val_f1_score=0.704]
Epoch 3:  92%|█████████▏| 234/255 [01:27<00:07,  2.69it/s, loss=0.51, v_num=0, train_loss=0.408, train_accuracy=0.778, trai

Epoch 3, global step 903: val_loss reached 0.57847 (best 0.57847), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3-v1.ckpt" as top 2


Epoch 4:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.516, v_num=0, train_loss=0.429, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.578, val_accuracy=0.702, val_f1_score=0.702]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 4:  89%|████████▉ | 228/255 [01:26<00:10,  2.64it/s, loss=0.516, v_num=0, train_loss=0.429, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.578, val_accuracy=0.702, val_f1_score=0.702]
Epoch 4:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.516, v_num=0, train_loss=0.429, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.578, val_accuracy=0.702, val_f1_score=0.702]
Epoch 4:  91%|█████████ | 232/255 [01:26<00:08,  2.67it/s, loss=0.516, v_num=0, train_loss=0.429, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.578, val_accuracy=0.702, val_f1_score=0.702]
Epoch 4:  92%|█████████▏| 234/255 [01:26<00:07,  2.69it/s, loss=0.516, v_num=0, train_loss=0.429, train_accuracy=0.778, 

Epoch 4, global step 1129: val_loss was not in top 2


Epoch 5:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.448, v_num=0, train_loss=0.514, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.594, val_accuracy=0.718, val_f1_score=0.718]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 5:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.448, v_num=0, train_loss=0.514, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.594, val_accuracy=0.718, val_f1_score=0.718]
Epoch 5:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.448, v_num=0, train_loss=0.514, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.594, val_accuracy=0.718, val_f1_score=0.718]
Epoch 5:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.448, v_num=0, train_loss=0.514, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.594, val_accuracy=0.718, val_f1_score=0.718]
Epoch 5:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.448, v_num=0, train_loss=0.514, train_accuracy=0.778, 

Epoch 5, global step 1355: val_loss reached 0.49710 (best 0.49710), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3.ckpt" as top 2


Epoch 6:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.463, v_num=0, train_loss=0.200, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.497, val_accuracy=0.786, val_f1_score=0.786]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 6:  89%|████████▉ | 228/255 [01:26<00:10,  2.64it/s, loss=0.463, v_num=0, train_loss=0.200, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.497, val_accuracy=0.786, val_f1_score=0.786]
Epoch 6:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.463, v_num=0, train_loss=0.200, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.497, val_accuracy=0.786, val_f1_score=0.786]
Epoch 6:  91%|█████████ | 232/255 [01:26<00:08,  2.67it/s, loss=0.463, v_num=0, train_loss=0.200, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.497, val_accuracy=0.786, val_f1_score=0.786]
Epoch 6:  92%|█████████▏| 234/255 [01:26<00:07,  2.69it/s, loss=0.463, v_num=0, train_loss=0.200, train_accuracy=1.000, 

Epoch 6, global step 1581: val_loss reached 0.52673 (best 0.49710), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3-v1.ckpt" as top 2


Epoch 7:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.391, v_num=0, train_loss=0.336, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.527, val_accuracy=0.766, val_f1_score=0.766]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 7:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.391, v_num=0, train_loss=0.336, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.527, val_accuracy=0.766, val_f1_score=0.766]
Epoch 7:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.391, v_num=0, train_loss=0.336, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.527, val_accuracy=0.766, val_f1_score=0.766]
Epoch 7:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.391, v_num=0, train_loss=0.336, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.527, val_accuracy=0.766, val_f1_score=0.766]
Epoch 7:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.391, v_num=0, train_loss=0.336, train_accuracy=0.833, 

Epoch 7, global step 1807: val_loss reached 0.43516 (best 0.43516), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3-v1.ckpt" as top 2


Epoch 8:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.406, v_num=0, train_loss=0.424, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.435, val_accuracy=0.813, val_f1_score=0.813]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 8:  89%|████████▉ | 228/255 [01:26<00:10,  2.62it/s, loss=0.406, v_num=0, train_loss=0.424, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.435, val_accuracy=0.813, val_f1_score=0.813]
Epoch 8:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.406, v_num=0, train_loss=0.424, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.435, val_accuracy=0.813, val_f1_score=0.813]
Epoch 8:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.406, v_num=0, train_loss=0.424, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.435, val_accuracy=0.813, val_f1_score=0.813]
Epoch 8:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.406, v_num=0, train_loss=0.424, train_accuracy=0.944, 

Epoch 8, global step 2033: val_loss was not in top 2


Epoch 9:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.362, v_num=0, train_loss=0.365, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.511, val_accuracy=0.794, val_f1_score=0.794]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 9:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.362, v_num=0, train_loss=0.365, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.511, val_accuracy=0.794, val_f1_score=0.794]
Epoch 9:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.362, v_num=0, train_loss=0.365, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.511, val_accuracy=0.794, val_f1_score=0.794]
Epoch 9:  91%|█████████ | 232/255 [01:27<00:08,  2.67it/s, loss=0.362, v_num=0, train_loss=0.365, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.511, val_accuracy=0.794, val_f1_score=0.794]
Epoch 9:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.362, v_num=0, train_loss=0.365, train_accuracy=0.722, 

Epoch 9, global step 2259: val_loss reached 0.43502 (best 0.43502), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3.ckpt" as top 2


Epoch 10:  89%|████████▊ | 226/255 [01:19<00:10,  2.84it/s, loss=0.36, v_num=0, train_loss=0.609, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.435, val_accuracy=0.820, val_f1_score=0.820] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 10:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.36, v_num=0, train_loss=0.609, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.435, val_accuracy=0.820, val_f1_score=0.820]
Epoch 10:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.36, v_num=0, train_loss=0.609, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.435, val_accuracy=0.820, val_f1_score=0.820]
Epoch 10:  91%|█████████ | 232/255 [01:26<00:08,  2.69it/s, loss=0.36, v_num=0, train_loss=0.609, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.435, val_accuracy=0.820, val_f1_score=0.820]
Epoch 10:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.36, v_num=0, train_loss=0.609, train_accuracy=0.722,

Epoch 10, global step 2485: val_loss reached 0.43316 (best 0.43316), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3-v1.ckpt" as top 2


Epoch 11:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.609, v_num=0, train_loss=0.615, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.433, val_accuracy=0.829, val_f1_score=0.829]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 11:  89%|████████▉ | 228/255 [01:26<00:10,  2.64it/s, loss=0.609, v_num=0, train_loss=0.615, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.433, val_accuracy=0.829, val_f1_score=0.829]
Epoch 11:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.609, v_num=0, train_loss=0.615, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.433, val_accuracy=0.829, val_f1_score=0.829]
Epoch 11:  91%|█████████ | 232/255 [01:26<00:08,  2.67it/s, loss=0.609, v_num=0, train_loss=0.615, train_accuracy=0.667, train_f1_score=0.667, val_loss=0.433, val_accuracy=0.829, val_f1_score=0.829]
Epoch 11:  92%|█████████▏| 234/255 [01:26<00:07,  2.69it/s, loss=0.609, v_num=0, train_loss=0.615, train_accuracy=0.

Epoch 11, global step 2711: val_loss was not in top 2


Epoch 12:  89%|████████▊ | 226/255 [01:19<00:10,  2.84it/s, loss=0.446, v_num=0, train_loss=0.286, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.617, val_accuracy=0.666, val_f1_score=0.666]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 12:  89%|████████▉ | 228/255 [01:26<00:10,  2.65it/s, loss=0.446, v_num=0, train_loss=0.286, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.617, val_accuracy=0.666, val_f1_score=0.666]
Epoch 12:  90%|█████████ | 230/255 [01:26<00:09,  2.67it/s, loss=0.446, v_num=0, train_loss=0.286, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.617, val_accuracy=0.666, val_f1_score=0.666]
Epoch 12:  91%|█████████ | 232/255 [01:26<00:08,  2.68it/s, loss=0.446, v_num=0, train_loss=0.286, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.617, val_accuracy=0.666, val_f1_score=0.666]
Epoch 12:  92%|█████████▏| 234/255 [01:26<00:07,  2.70it/s, loss=0.446, v_num=0, train_loss=0.286, train_accuracy=0.

Epoch 12, global step 2937: val_loss was not in top 2


Epoch 13:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.578, v_num=0, train_loss=0.422, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.513, val_accuracy=0.774, val_f1_score=0.774]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 13:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.578, v_num=0, train_loss=0.422, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.513, val_accuracy=0.774, val_f1_score=0.774]
Epoch 13:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.578, v_num=0, train_loss=0.422, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.513, val_accuracy=0.774, val_f1_score=0.774]
Epoch 13:  91%|█████████ | 232/255 [01:27<00:08,  2.67it/s, loss=0.578, v_num=0, train_loss=0.422, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.513, val_accuracy=0.774, val_f1_score=0.774]
Epoch 13:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.578, v_num=0, train_loss=0.422, train_accuracy=0.

Epoch 13, global step 3163: val_loss was not in top 2


Epoch 14:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.377, v_num=0, train_loss=0.330, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.630, val_accuracy=0.682, val_f1_score=0.682]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 14:  89%|████████▉ | 228/255 [01:26<00:10,  2.62it/s, loss=0.377, v_num=0, train_loss=0.330, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.630, val_accuracy=0.682, val_f1_score=0.682]
Epoch 14:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.377, v_num=0, train_loss=0.330, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.630, val_accuracy=0.682, val_f1_score=0.682]
Epoch 14:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.377, v_num=0, train_loss=0.330, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.630, val_accuracy=0.682, val_f1_score=0.682]
Epoch 14:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.377, v_num=0, train_loss=0.330, train_accuracy=0.

Epoch 14, global step 3389: val_loss was not in top 2


Epoch 15:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.331, v_num=0, train_loss=0.636, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.483, val_accuracy=0.819, val_f1_score=0.819]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 15:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.331, v_num=0, train_loss=0.636, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.483, val_accuracy=0.819, val_f1_score=0.819]
Epoch 15:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.331, v_num=0, train_loss=0.636, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.483, val_accuracy=0.819, val_f1_score=0.819]
Epoch 15:  91%|█████████ | 232/255 [01:26<00:08,  2.67it/s, loss=0.331, v_num=0, train_loss=0.636, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.483, val_accuracy=0.819, val_f1_score=0.819]
Epoch 15:  92%|█████████▏| 234/255 [01:27<00:07,  2.69it/s, loss=0.331, v_num=0, train_loss=0.636, train_accuracy=0.

Epoch 15, global step 3615: val_loss was not in top 2


Epoch 16:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.326, v_num=0, train_loss=0.268, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.477, val_accuracy=0.819, val_f1_score=0.819]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 16:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.326, v_num=0, train_loss=0.268, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.477, val_accuracy=0.819, val_f1_score=0.819]
Epoch 16:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.326, v_num=0, train_loss=0.268, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.477, val_accuracy=0.819, val_f1_score=0.819]
Epoch 16:  91%|█████████ | 232/255 [01:26<00:08,  2.67it/s, loss=0.326, v_num=0, train_loss=0.268, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.477, val_accuracy=0.819, val_f1_score=0.819]
Epoch 16:  92%|█████████▏| 234/255 [01:27<00:07,  2.69it/s, loss=0.326, v_num=0, train_loss=0.268, train_accuracy=0.

Epoch 16, global step 3841: val_loss was not in top 2


Epoch 17:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.283, v_num=0, train_loss=0.165, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.444, val_accuracy=0.814, val_f1_score=0.814]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 17:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.283, v_num=0, train_loss=0.165, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.444, val_accuracy=0.814, val_f1_score=0.814]
Epoch 17:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.283, v_num=0, train_loss=0.165, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.444, val_accuracy=0.814, val_f1_score=0.814]
Epoch 17:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.283, v_num=0, train_loss=0.165, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.444, val_accuracy=0.814, val_f1_score=0.814]
Epoch 17:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.283, v_num=0, train_loss=0.165, train_accuracy=1.

Epoch 17, global step 4067: val_loss was not in top 2


Epoch 18:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.285, v_num=0, train_loss=0.257, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.437, val_accuracy=0.828, val_f1_score=0.828]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 18:  89%|████████▉ | 228/255 [01:26<00:10,  2.64it/s, loss=0.285, v_num=0, train_loss=0.257, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.437, val_accuracy=0.828, val_f1_score=0.828]
Epoch 18:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.285, v_num=0, train_loss=0.257, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.437, val_accuracy=0.828, val_f1_score=0.828]
Epoch 18:  91%|█████████ | 232/255 [01:26<00:08,  2.67it/s, loss=0.285, v_num=0, train_loss=0.257, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.437, val_accuracy=0.828, val_f1_score=0.828]
Epoch 18:  92%|█████████▏| 234/255 [01:26<00:07,  2.69it/s, loss=0.285, v_num=0, train_loss=0.257, train_accuracy=0.

Epoch 18, global step 4293: val_loss was not in top 2


Epoch 19:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.302, v_num=0, train_loss=0.236, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.450, val_accuracy=0.842, val_f1_score=0.842]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 19:  89%|████████▉ | 228/255 [01:26<00:10,  2.64it/s, loss=0.302, v_num=0, train_loss=0.236, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.450, val_accuracy=0.842, val_f1_score=0.842]
Epoch 19:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.302, v_num=0, train_loss=0.236, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.450, val_accuracy=0.842, val_f1_score=0.842]
Epoch 19:  91%|█████████ | 232/255 [01:26<00:08,  2.67it/s, loss=0.302, v_num=0, train_loss=0.236, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.450, val_accuracy=0.842, val_f1_score=0.842]
Epoch 19:  92%|█████████▏| 234/255 [01:26<00:07,  2.69it/s, loss=0.302, v_num=0, train_loss=0.236, train_accuracy=0.

Epoch 19, global step 4519: val_loss was not in top 2


Epoch 20:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.265, v_num=0, train_loss=0.185, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.460, val_accuracy=0.838, val_f1_score=0.838]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 20:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.265, v_num=0, train_loss=0.185, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.460, val_accuracy=0.838, val_f1_score=0.838]
Epoch 20:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.265, v_num=0, train_loss=0.185, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.460, val_accuracy=0.838, val_f1_score=0.838]
Epoch 20:  91%|█████████ | 232/255 [01:27<00:08,  2.67it/s, loss=0.265, v_num=0, train_loss=0.185, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.460, val_accuracy=0.838, val_f1_score=0.838]
Epoch 20:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.265, v_num=0, train_loss=0.185, train_accuracy=0.

Epoch 20, global step 4745: val_loss reached 0.39426 (best 0.39426), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3.ckpt" as top 2


Epoch 21:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.238, v_num=0, train_loss=0.203, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.394, val_accuracy=0.839, val_f1_score=0.839]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 21:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.238, v_num=0, train_loss=0.203, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.394, val_accuracy=0.839, val_f1_score=0.839]
Epoch 21:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.238, v_num=0, train_loss=0.203, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.394, val_accuracy=0.839, val_f1_score=0.839]
Epoch 21:  91%|█████████ | 232/255 [01:26<00:08,  2.67it/s, loss=0.238, v_num=0, train_loss=0.203, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.394, val_accuracy=0.839, val_f1_score=0.839]
Epoch 21:  92%|█████████▏| 234/255 [01:27<00:07,  2.69it/s, loss=0.238, v_num=0, train_loss=0.203, train_accuracy=0.

Epoch 21, global step 4971: val_loss was not in top 2


Epoch 22:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.527, v_num=0, train_loss=0.437, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.495, val_accuracy=0.850, val_f1_score=0.850]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 22:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.527, v_num=0, train_loss=0.437, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.495, val_accuracy=0.850, val_f1_score=0.850]
Epoch 22:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.527, v_num=0, train_loss=0.437, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.495, val_accuracy=0.850, val_f1_score=0.850]
Epoch 22:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.527, v_num=0, train_loss=0.437, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.495, val_accuracy=0.850, val_f1_score=0.850]
Epoch 22:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.527, v_num=0, train_loss=0.437, train_accuracy=0.

Epoch 22, global step 5197: val_loss was not in top 2


Epoch 23:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.393, v_num=0, train_loss=0.165, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.565, val_accuracy=0.686, val_f1_score=0.686]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 23:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.393, v_num=0, train_loss=0.165, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.565, val_accuracy=0.686, val_f1_score=0.686]
Epoch 23:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.393, v_num=0, train_loss=0.165, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.565, val_accuracy=0.686, val_f1_score=0.686]
Epoch 23:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.393, v_num=0, train_loss=0.165, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.565, val_accuracy=0.686, val_f1_score=0.686]
Epoch 23:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.393, v_num=0, train_loss=0.165, train_accuracy=1.

Epoch 23, global step 5423: val_loss was not in top 2


Epoch 24:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.37, v_num=0, train_loss=0.531, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.474, val_accuracy=0.795, val_f1_score=0.795] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 24:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.37, v_num=0, train_loss=0.531, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.474, val_accuracy=0.795, val_f1_score=0.795]
Epoch 24:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.37, v_num=0, train_loss=0.531, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.474, val_accuracy=0.795, val_f1_score=0.795]
Epoch 24:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.37, v_num=0, train_loss=0.531, train_accuracy=0.722, train_f1_score=0.722, val_loss=0.474, val_accuracy=0.795, val_f1_score=0.795]
Epoch 24:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.37, v_num=0, train_loss=0.531, train_accuracy=0.722,

Epoch 24, global step 5649: val_loss was not in top 2


Epoch 25:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.304, v_num=0, train_loss=0.176, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.445, val_accuracy=0.823, val_f1_score=0.823]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 25:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.304, v_num=0, train_loss=0.176, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.445, val_accuracy=0.823, val_f1_score=0.823]
Epoch 25:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.304, v_num=0, train_loss=0.176, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.445, val_accuracy=0.823, val_f1_score=0.823]
Epoch 25:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.304, v_num=0, train_loss=0.176, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.445, val_accuracy=0.823, val_f1_score=0.823]
Epoch 25:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.304, v_num=0, train_loss=0.176, train_accuracy=0.

Epoch 25, global step 5875: val_loss was not in top 2


Epoch 26:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.26, v_num=0, train_loss=0.292, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.451, val_accuracy=0.830, val_f1_score=0.830]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 26:  89%|████████▉ | 228/255 [01:26<00:10,  2.64it/s, loss=0.26, v_num=0, train_loss=0.292, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.451, val_accuracy=0.830, val_f1_score=0.830]
Epoch 26:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.26, v_num=0, train_loss=0.292, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.451, val_accuracy=0.830, val_f1_score=0.830]
Epoch 26:  91%|█████████ | 232/255 [01:26<00:08,  2.67it/s, loss=0.26, v_num=0, train_loss=0.292, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.451, val_accuracy=0.830, val_f1_score=0.830]
Epoch 26:  92%|█████████▏| 234/255 [01:26<00:07,  2.69it/s, loss=0.26, v_num=0, train_loss=0.292, train_accuracy=0.833

Epoch 26, global step 6101: val_loss reached 0.42901 (best 0.39426), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3-v1.ckpt" as top 2


Epoch 27:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.274, v_num=0, train_loss=0.467, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.429, val_accuracy=0.840, val_f1_score=0.840]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 27:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.274, v_num=0, train_loss=0.467, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.429, val_accuracy=0.840, val_f1_score=0.840]
Epoch 27:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.274, v_num=0, train_loss=0.467, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.429, val_accuracy=0.840, val_f1_score=0.840]
Epoch 27:  91%|█████████ | 232/255 [01:26<00:08,  2.67it/s, loss=0.274, v_num=0, train_loss=0.467, train_accuracy=0.778, train_f1_score=0.778, val_loss=0.429, val_accuracy=0.840, val_f1_score=0.840]
Epoch 27:  92%|█████████▏| 234/255 [01:27<00:07,  2.69it/s, loss=0.274, v_num=0, train_loss=0.467, train_accuracy=0.

Epoch 27, global step 6327: val_loss reached 0.41831 (best 0.39426), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3-v1.ckpt" as top 2


Epoch 28:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.227, v_num=0, train_loss=0.235, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.418, val_accuracy=0.847, val_f1_score=0.847] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 28:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.227, v_num=0, train_loss=0.235, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.418, val_accuracy=0.847, val_f1_score=0.847]
Epoch 28:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.227, v_num=0, train_loss=0.235, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.418, val_accuracy=0.847, val_f1_score=0.847]
Epoch 28:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.227, v_num=0, train_loss=0.235, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.418, val_accuracy=0.847, val_f1_score=0.847]
Epoch 28:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.227, v_num=0, train_loss=0.235, train_accuracy=0

Epoch 28, global step 6553: val_loss was not in top 2


Epoch 29:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.249, v_num=0, train_loss=0.220, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.538, val_accuracy=0.828, val_f1_score=0.828] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 29:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.249, v_num=0, train_loss=0.220, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.538, val_accuracy=0.828, val_f1_score=0.828]
Epoch 29:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.249, v_num=0, train_loss=0.220, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.538, val_accuracy=0.828, val_f1_score=0.828]
Epoch 29:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.249, v_num=0, train_loss=0.220, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.538, val_accuracy=0.828, val_f1_score=0.828]
Epoch 29:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.249, v_num=0, train_loss=0.220, train_accuracy=0

Epoch 29, global step 6779: val_loss was not in top 2


Epoch 30:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.225, v_num=0, train_loss=0.212, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.464, val_accuracy=0.841, val_f1_score=0.841] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 30:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.225, v_num=0, train_loss=0.212, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.464, val_accuracy=0.841, val_f1_score=0.841]
Epoch 30:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.225, v_num=0, train_loss=0.212, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.464, val_accuracy=0.841, val_f1_score=0.841]
Epoch 30:  91%|█████████ | 232/255 [01:27<00:08,  2.67it/s, loss=0.225, v_num=0, train_loss=0.212, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.464, val_accuracy=0.841, val_f1_score=0.841]
Epoch 30:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.225, v_num=0, train_loss=0.212, train_accuracy=0

Epoch 30, global step 7005: val_loss was not in top 2


Epoch 31:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.198, v_num=0, train_loss=0.174, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.480, val_accuracy=0.840, val_f1_score=0.840] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 31:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.198, v_num=0, train_loss=0.174, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.480, val_accuracy=0.840, val_f1_score=0.840]
Epoch 31:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.198, v_num=0, train_loss=0.174, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.480, val_accuracy=0.840, val_f1_score=0.840]
Epoch 31:  91%|█████████ | 232/255 [01:26<00:08,  2.67it/s, loss=0.198, v_num=0, train_loss=0.174, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.480, val_accuracy=0.840, val_f1_score=0.840]
Epoch 31:  92%|█████████▏| 234/255 [01:27<00:07,  2.69it/s, loss=0.198, v_num=0, train_loss=0.174, train_accuracy=0

Epoch 31, global step 7231: val_loss was not in top 2


Epoch 32:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.187, v_num=0, train_loss=0.205, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.452, val_accuracy=0.852, val_f1_score=0.852] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 32:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.187, v_num=0, train_loss=0.205, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.452, val_accuracy=0.852, val_f1_score=0.852]
Epoch 32:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.187, v_num=0, train_loss=0.205, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.452, val_accuracy=0.852, val_f1_score=0.852]
Epoch 32:  91%|█████████ | 232/255 [01:26<00:08,  2.67it/s, loss=0.187, v_num=0, train_loss=0.205, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.452, val_accuracy=0.852, val_f1_score=0.852]
Epoch 32:  92%|█████████▏| 234/255 [01:27<00:07,  2.69it/s, loss=0.187, v_num=0, train_loss=0.205, train_accuracy=0

Epoch 32, global step 7457: val_loss reached 0.40944 (best 0.39426), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3-v1.ckpt" as top 2


Epoch 33:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.182, v_num=0, train_loss=0.405, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.409, val_accuracy=0.866, val_f1_score=0.866] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 33:  89%|████████▉ | 228/255 [01:26<00:10,  2.62it/s, loss=0.182, v_num=0, train_loss=0.405, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.409, val_accuracy=0.866, val_f1_score=0.866]
Epoch 33:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.182, v_num=0, train_loss=0.405, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.409, val_accuracy=0.866, val_f1_score=0.866]
Epoch 33:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.182, v_num=0, train_loss=0.405, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.409, val_accuracy=0.866, val_f1_score=0.866]
Epoch 33:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.182, v_num=0, train_loss=0.405, train_accuracy=0

Epoch 33, global step 7683: val_loss reached 0.39874 (best 0.39426), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3-v1.ckpt" as top 2


Epoch 34:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.186, v_num=0, train_loss=0.291, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.399, val_accuracy=0.863, val_f1_score=0.863] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 34:  89%|████████▉ | 228/255 [01:26<00:10,  2.62it/s, loss=0.186, v_num=0, train_loss=0.291, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.399, val_accuracy=0.863, val_f1_score=0.863]
Epoch 34:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.186, v_num=0, train_loss=0.291, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.399, val_accuracy=0.863, val_f1_score=0.863]
Epoch 34:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.186, v_num=0, train_loss=0.291, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.399, val_accuracy=0.863, val_f1_score=0.863]
Epoch 34:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.186, v_num=0, train_loss=0.291, train_accuracy=0

Epoch 34, global step 7909: val_loss was not in top 2


Epoch 35:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.202, v_num=0, train_loss=0.211, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.400, val_accuracy=0.865, val_f1_score=0.865] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 35:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.202, v_num=0, train_loss=0.211, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.400, val_accuracy=0.865, val_f1_score=0.865]
Epoch 35:  90%|█████████ | 230/255 [01:26<00:09,  2.64it/s, loss=0.202, v_num=0, train_loss=0.211, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.400, val_accuracy=0.865, val_f1_score=0.865]
Epoch 35:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.202, v_num=0, train_loss=0.211, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.400, val_accuracy=0.865, val_f1_score=0.865]
Epoch 35:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.202, v_num=0, train_loss=0.211, train_accuracy=0

Epoch 35, global step 8135: val_loss was not in top 2


Epoch 36:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.164, v_num=0, train_loss=0.162, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.446, val_accuracy=0.856, val_f1_score=0.856] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 36:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.164, v_num=0, train_loss=0.162, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.446, val_accuracy=0.856, val_f1_score=0.856]
Epoch 36:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.164, v_num=0, train_loss=0.162, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.446, val_accuracy=0.856, val_f1_score=0.856]
Epoch 36:  91%|█████████ | 232/255 [01:27<00:08,  2.67it/s, loss=0.164, v_num=0, train_loss=0.162, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.446, val_accuracy=0.856, val_f1_score=0.856]
Epoch 36:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.164, v_num=0, train_loss=0.162, train_accuracy=0

Epoch 36, global step 8361: val_loss was not in top 2


Epoch 37:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.186, v_num=0, train_loss=0.138, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.411, val_accuracy=0.867, val_f1_score=0.867] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 37:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.186, v_num=0, train_loss=0.138, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.411, val_accuracy=0.867, val_f1_score=0.867]
Epoch 37:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.186, v_num=0, train_loss=0.138, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.411, val_accuracy=0.867, val_f1_score=0.867]
Epoch 37:  91%|█████████ | 232/255 [01:27<00:08,  2.67it/s, loss=0.186, v_num=0, train_loss=0.138, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.411, val_accuracy=0.867, val_f1_score=0.867]
Epoch 37:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.186, v_num=0, train_loss=0.138, train_accuracy=0

Epoch 37, global step 8587: val_loss was not in top 2


Epoch 38:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.152, v_num=0, train_loss=0.336, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.426, val_accuracy=0.877, val_f1_score=0.877] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 38:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.152, v_num=0, train_loss=0.336, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.426, val_accuracy=0.877, val_f1_score=0.877]
Epoch 38:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.152, v_num=0, train_loss=0.336, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.426, val_accuracy=0.877, val_f1_score=0.877]
Epoch 38:  91%|█████████ | 232/255 [01:26<00:08,  2.67it/s, loss=0.152, v_num=0, train_loss=0.336, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.426, val_accuracy=0.877, val_f1_score=0.877]
Epoch 38:  92%|█████████▏| 234/255 [01:27<00:07,  2.69it/s, loss=0.152, v_num=0, train_loss=0.336, train_accuracy=0

Epoch 38, global step 8813: val_loss was not in top 2


Epoch 39:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.15, v_num=0, train_loss=0.180, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.420, val_accuracy=0.880, val_f1_score=0.880]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 39:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.15, v_num=0, train_loss=0.180, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.420, val_accuracy=0.880, val_f1_score=0.880]
Epoch 39:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.15, v_num=0, train_loss=0.180, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.420, val_accuracy=0.880, val_f1_score=0.880]
Epoch 39:  91%|█████████ | 232/255 [01:27<00:08,  2.67it/s, loss=0.15, v_num=0, train_loss=0.180, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.420, val_accuracy=0.880, val_f1_score=0.880]
Epoch 39:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.15, v_num=0, train_loss=0.180, train_accuracy=0.944

Epoch 39, global step 9039: val_loss was not in top 2


Epoch 40:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.292, v_num=0, train_loss=0.214, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.462, val_accuracy=0.859, val_f1_score=0.859] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 40:  89%|████████▉ | 228/255 [01:26<00:10,  2.62it/s, loss=0.292, v_num=0, train_loss=0.214, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.462, val_accuracy=0.859, val_f1_score=0.859]
Epoch 40:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.292, v_num=0, train_loss=0.214, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.462, val_accuracy=0.859, val_f1_score=0.859]
Epoch 40:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.292, v_num=0, train_loss=0.214, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.462, val_accuracy=0.859, val_f1_score=0.859]
Epoch 40:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.292, v_num=0, train_loss=0.214, train_accuracy=0

Epoch 40, global step 9265: val_loss was not in top 2


Epoch 41:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.119, v_num=0, train_loss=0.163, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.629, val_accuracy=0.828, val_f1_score=0.828] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 41:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.119, v_num=0, train_loss=0.163, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.629, val_accuracy=0.828, val_f1_score=0.828]
Epoch 41:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.119, v_num=0, train_loss=0.163, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.629, val_accuracy=0.828, val_f1_score=0.828]
Epoch 41:  91%|█████████ | 232/255 [01:27<00:08,  2.67it/s, loss=0.119, v_num=0, train_loss=0.163, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.629, val_accuracy=0.828, val_f1_score=0.828]
Epoch 41:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.119, v_num=0, train_loss=0.163, train_accuracy=0

Epoch 41, global step 9491: val_loss was not in top 2


Epoch 42:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.179, v_num=0, train_loss=0.209, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.572, val_accuracy=0.861, val_f1_score=0.861] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 42:  89%|████████▉ | 228/255 [01:26<00:10,  2.62it/s, loss=0.179, v_num=0, train_loss=0.209, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.572, val_accuracy=0.861, val_f1_score=0.861]
Epoch 42:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.179, v_num=0, train_loss=0.209, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.572, val_accuracy=0.861, val_f1_score=0.861]
Epoch 42:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.179, v_num=0, train_loss=0.209, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.572, val_accuracy=0.861, val_f1_score=0.861]
Epoch 42:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.179, v_num=0, train_loss=0.209, train_accuracy=0

Epoch 42, global step 9717: val_loss was not in top 2


Epoch 43:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.161, v_num=0, train_loss=0.0963, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.417, val_accuracy=0.863, val_f1_score=0.863]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 43:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.161, v_num=0, train_loss=0.0963, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.417, val_accuracy=0.863, val_f1_score=0.863]
Epoch 43:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.161, v_num=0, train_loss=0.0963, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.417, val_accuracy=0.863, val_f1_score=0.863]
Epoch 43:  91%|█████████ | 232/255 [01:27<00:08,  2.67it/s, loss=0.161, v_num=0, train_loss=0.0963, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.417, val_accuracy=0.863, val_f1_score=0.863]
Epoch 43:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.161, v_num=0, train_loss=0.0963, train_accura

Epoch 43, global step 9943: val_loss was not in top 2


Epoch 44:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.117, v_num=0, train_loss=0.0225, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.411, val_accuracy=0.881, val_f1_score=0.881]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 44:  89%|████████▉ | 228/255 [01:26<00:10,  2.62it/s, loss=0.117, v_num=0, train_loss=0.0225, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.411, val_accuracy=0.881, val_f1_score=0.881]
Epoch 44:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.117, v_num=0, train_loss=0.0225, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.411, val_accuracy=0.881, val_f1_score=0.881]
Epoch 44:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.117, v_num=0, train_loss=0.0225, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.411, val_accuracy=0.881, val_f1_score=0.881]
Epoch 44:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.117, v_num=0, train_loss=0.0225, train_accura

Epoch 44, global step 10169: val_loss reached 0.36170 (best 0.36170), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3-v1.ckpt" as top 2


Epoch 45:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.14, v_num=0, train_loss=0.459, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.362, val_accuracy=0.894, val_f1_score=0.894]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 45:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.14, v_num=0, train_loss=0.459, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.362, val_accuracy=0.894, val_f1_score=0.894]
Epoch 45:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.14, v_num=0, train_loss=0.459, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.362, val_accuracy=0.894, val_f1_score=0.894]
Epoch 45:  91%|█████████ | 232/255 [01:26<00:08,  2.67it/s, loss=0.14, v_num=0, train_loss=0.459, train_accuracy=0.833, train_f1_score=0.833, val_loss=0.362, val_accuracy=0.894, val_f1_score=0.894]
Epoch 45:  92%|█████████▏| 234/255 [01:27<00:07,  2.69it/s, loss=0.14, v_num=0, train_loss=0.459, train_accuracy=0.833

Epoch 45, global step 10395: val_loss reached 0.39296 (best 0.36170), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3.ckpt" as top 2


Epoch 46:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.117, v_num=0, train_loss=0.192, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.393, val_accuracy=0.891, val_f1_score=0.891]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 46:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.117, v_num=0, train_loss=0.192, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.393, val_accuracy=0.891, val_f1_score=0.891]
Epoch 46:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.117, v_num=0, train_loss=0.192, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.393, val_accuracy=0.891, val_f1_score=0.891]
Epoch 46:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.117, v_num=0, train_loss=0.192, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.393, val_accuracy=0.891, val_f1_score=0.891]
Epoch 46:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.117, v_num=0, train_loss=0.192, train_accuracy=

Epoch 46, global step 10621: val_loss was not in top 2


Epoch 47:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.103, v_num=0, train_loss=0.0239, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.396, val_accuracy=0.892, val_f1_score=0.892] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 47:  89%|████████▉ | 228/255 [01:26<00:10,  2.62it/s, loss=0.103, v_num=0, train_loss=0.0239, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.396, val_accuracy=0.892, val_f1_score=0.892]
Epoch 47:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.103, v_num=0, train_loss=0.0239, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.396, val_accuracy=0.892, val_f1_score=0.892]
Epoch 47:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.103, v_num=0, train_loss=0.0239, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.396, val_accuracy=0.892, val_f1_score=0.892]
Epoch 47:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.103, v_num=0, train_loss=0.0239, train_accur

Epoch 47, global step 10847: val_loss was not in top 2


Epoch 48:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.102, v_num=0, train_loss=0.174, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.423, val_accuracy=0.892, val_f1_score=0.892]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 48:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.102, v_num=0, train_loss=0.174, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.423, val_accuracy=0.892, val_f1_score=0.892]
Epoch 48:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.102, v_num=0, train_loss=0.174, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.423, val_accuracy=0.892, val_f1_score=0.892]
Epoch 48:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.102, v_num=0, train_loss=0.174, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.423, val_accuracy=0.892, val_f1_score=0.892]
Epoch 48:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.102, v_num=0, train_loss=0.174, train_accuracy=

Epoch 48, global step 11073: val_loss was not in top 2


Epoch 49:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.112, v_num=0, train_loss=0.102, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.510, val_accuracy=0.880, val_f1_score=0.880]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 49:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.112, v_num=0, train_loss=0.102, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.510, val_accuracy=0.880, val_f1_score=0.880]
Epoch 49:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.112, v_num=0, train_loss=0.102, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.510, val_accuracy=0.880, val_f1_score=0.880]
Epoch 49:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.112, v_num=0, train_loss=0.102, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.510, val_accuracy=0.880, val_f1_score=0.880]
Epoch 49:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.112, v_num=0, train_loss=0.102, train_accuracy=

Epoch 49, global step 11299: val_loss was not in top 2


Epoch 50:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.177, v_num=0, train_loss=0.146, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.414, val_accuracy=0.891, val_f1_score=0.891]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 50:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.177, v_num=0, train_loss=0.146, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.414, val_accuracy=0.891, val_f1_score=0.891]
Epoch 50:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.177, v_num=0, train_loss=0.146, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.414, val_accuracy=0.891, val_f1_score=0.891]
Epoch 50:  91%|█████████ | 232/255 [01:26<00:08,  2.67it/s, loss=0.177, v_num=0, train_loss=0.146, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.414, val_accuracy=0.891, val_f1_score=0.891]
Epoch 50:  92%|█████████▏| 234/255 [01:27<00:07,  2.69it/s, loss=0.177, v_num=0, train_loss=0.146, train_accuracy=

Epoch 50, global step 11525: val_loss was not in top 2


Epoch 51:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.102, v_num=0, train_loss=0.114, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.461, val_accuracy=0.884, val_f1_score=0.884]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 51:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.102, v_num=0, train_loss=0.114, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.461, val_accuracy=0.884, val_f1_score=0.884]
Epoch 51:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.102, v_num=0, train_loss=0.114, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.461, val_accuracy=0.884, val_f1_score=0.884]
Epoch 51:  91%|█████████ | 232/255 [01:26<00:08,  2.67it/s, loss=0.102, v_num=0, train_loss=0.114, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.461, val_accuracy=0.884, val_f1_score=0.884]
Epoch 51:  92%|█████████▏| 234/255 [01:27<00:07,  2.69it/s, loss=0.102, v_num=0, train_loss=0.114, train_accuracy=

Epoch 51, global step 11751: val_loss was not in top 2


Epoch 52:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.112, v_num=0, train_loss=0.0375, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.438, val_accuracy=0.886, val_f1_score=0.886] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 52:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.112, v_num=0, train_loss=0.0375, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.438, val_accuracy=0.886, val_f1_score=0.886]
Epoch 52:  90%|█████████ | 230/255 [01:26<00:09,  2.64it/s, loss=0.112, v_num=0, train_loss=0.0375, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.438, val_accuracy=0.886, val_f1_score=0.886]
Epoch 52:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.112, v_num=0, train_loss=0.0375, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.438, val_accuracy=0.886, val_f1_score=0.886]
Epoch 52:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.112, v_num=0, train_loss=0.0375, train_accur

Epoch 52, global step 11977: val_loss reached 0.37315 (best 0.36170), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3.ckpt" as top 2


Epoch 53:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.112, v_num=0, train_loss=0.0561, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.373, val_accuracy=0.908, val_f1_score=0.908] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 53:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.112, v_num=0, train_loss=0.0561, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.373, val_accuracy=0.908, val_f1_score=0.908]
Epoch 53:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.112, v_num=0, train_loss=0.0561, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.373, val_accuracy=0.908, val_f1_score=0.908]
Epoch 53:  91%|█████████ | 232/255 [01:27<00:08,  2.67it/s, loss=0.112, v_num=0, train_loss=0.0561, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.373, val_accuracy=0.908, val_f1_score=0.908]
Epoch 53:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.112, v_num=0, train_loss=0.0561, train_accur

Epoch 53, global step 12203: val_loss reached 0.36269 (best 0.36170), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3.ckpt" as top 2


Epoch 54:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.157, v_num=0, train_loss=0.0576, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.363, val_accuracy=0.897, val_f1_score=0.897] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 54:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.157, v_num=0, train_loss=0.0576, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.363, val_accuracy=0.897, val_f1_score=0.897]
Epoch 54:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.157, v_num=0, train_loss=0.0576, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.363, val_accuracy=0.897, val_f1_score=0.897]
Epoch 54:  91%|█████████ | 232/255 [01:26<00:08,  2.67it/s, loss=0.157, v_num=0, train_loss=0.0576, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.363, val_accuracy=0.897, val_f1_score=0.897]
Epoch 54:  92%|█████████▏| 234/255 [01:27<00:07,  2.69it/s, loss=0.157, v_num=0, train_loss=0.0576, train_accur

Epoch 54, global step 12429: val_loss reached 0.28694 (best 0.28694), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3.ckpt" as top 2


Epoch 55:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.127, v_num=0, train_loss=0.0867, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.287, val_accuracy=0.896, val_f1_score=0.896]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 55:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.127, v_num=0, train_loss=0.0867, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.287, val_accuracy=0.896, val_f1_score=0.896]
Epoch 55:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.127, v_num=0, train_loss=0.0867, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.287, val_accuracy=0.896, val_f1_score=0.896]
Epoch 55:  91%|█████████ | 232/255 [01:26<00:08,  2.67it/s, loss=0.127, v_num=0, train_loss=0.0867, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.287, val_accuracy=0.896, val_f1_score=0.896]
Epoch 55:  92%|█████████▏| 234/255 [01:27<00:07,  2.69it/s, loss=0.127, v_num=0, train_loss=0.0867, train_accura

Epoch 55, global step 12655: val_loss was not in top 2


Epoch 56:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.119, v_num=0, train_loss=0.0916, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.414, val_accuracy=0.883, val_f1_score=0.883] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 56:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.119, v_num=0, train_loss=0.0916, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.414, val_accuracy=0.883, val_f1_score=0.883]
Epoch 56:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.119, v_num=0, train_loss=0.0916, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.414, val_accuracy=0.883, val_f1_score=0.883]
Epoch 56:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.119, v_num=0, train_loss=0.0916, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.414, val_accuracy=0.883, val_f1_score=0.883]
Epoch 56:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.119, v_num=0, train_loss=0.0916, train_accur

Epoch 56, global step 12881: val_loss reached 0.35353 (best 0.28694), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3-v1.ckpt" as top 2


Epoch 57:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.122, v_num=0, train_loss=0.313, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.354, val_accuracy=0.895, val_f1_score=0.895]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 57:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.122, v_num=0, train_loss=0.313, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.354, val_accuracy=0.895, val_f1_score=0.895]
Epoch 57:  90%|█████████ | 230/255 [01:26<00:09,  2.64it/s, loss=0.122, v_num=0, train_loss=0.313, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.354, val_accuracy=0.895, val_f1_score=0.895]
Epoch 57:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.122, v_num=0, train_loss=0.313, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.354, val_accuracy=0.895, val_f1_score=0.895]
Epoch 57:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.122, v_num=0, train_loss=0.313, train_accuracy=

Epoch 57, global step 13107: val_loss was not in top 2


Epoch 58:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.103, v_num=0, train_loss=0.123, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.368, val_accuracy=0.894, val_f1_score=0.894]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 58:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.103, v_num=0, train_loss=0.123, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.368, val_accuracy=0.894, val_f1_score=0.894]
Epoch 58:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.103, v_num=0, train_loss=0.123, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.368, val_accuracy=0.894, val_f1_score=0.894]
Epoch 58:  91%|█████████ | 232/255 [01:27<00:08,  2.67it/s, loss=0.103, v_num=0, train_loss=0.123, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.368, val_accuracy=0.894, val_f1_score=0.894]
Epoch 58:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.103, v_num=0, train_loss=0.123, train_accuracy=

Epoch 58, global step 13333: val_loss was not in top 2


Epoch 59:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0814, v_num=0, train_loss=0.0574, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.354, val_accuracy=0.901, val_f1_score=0.901]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 59:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.0814, v_num=0, train_loss=0.0574, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.354, val_accuracy=0.901, val_f1_score=0.901]
Epoch 59:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.0814, v_num=0, train_loss=0.0574, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.354, val_accuracy=0.901, val_f1_score=0.901]
Epoch 59:  91%|█████████ | 232/255 [01:26<00:08,  2.67it/s, loss=0.0814, v_num=0, train_loss=0.0574, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.354, val_accuracy=0.901, val_f1_score=0.901]
Epoch 59:  92%|█████████▏| 234/255 [01:27<00:07,  2.69it/s, loss=0.0814, v_num=0, train_loss=0.0574, train_a

Epoch 59, global step 13559: val_loss was not in top 2


Epoch 60:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0648, v_num=0, train_loss=0.0171, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.383, val_accuracy=0.896, val_f1_score=0.896]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 60:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.0648, v_num=0, train_loss=0.0171, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.383, val_accuracy=0.896, val_f1_score=0.896]
Epoch 60:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.0648, v_num=0, train_loss=0.0171, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.383, val_accuracy=0.896, val_f1_score=0.896]
Epoch 60:  91%|█████████ | 232/255 [01:26<00:08,  2.67it/s, loss=0.0648, v_num=0, train_loss=0.0171, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.383, val_accuracy=0.896, val_f1_score=0.896]
Epoch 60:  92%|█████████▏| 234/255 [01:27<00:07,  2.69it/s, loss=0.0648, v_num=0, train_loss=0.0171, train_a

Epoch 60, global step 13785: val_loss reached 0.33279 (best 0.28694), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3-v1.ckpt" as top 2


Epoch 61:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.101, v_num=0, train_loss=0.158, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.333, val_accuracy=0.908, val_f1_score=0.908]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 61:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.101, v_num=0, train_loss=0.158, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.333, val_accuracy=0.908, val_f1_score=0.908]
Epoch 61:  90%|█████████ | 230/255 [01:26<00:09,  2.64it/s, loss=0.101, v_num=0, train_loss=0.158, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.333, val_accuracy=0.908, val_f1_score=0.908]
Epoch 61:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.101, v_num=0, train_loss=0.158, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.333, val_accuracy=0.908, val_f1_score=0.908]
Epoch 61:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.101, v_num=0, train_loss=0.158, train_accuracy

Epoch 61, global step 14011: val_loss was not in top 2


Epoch 62:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.0684, v_num=0, train_loss=0.128, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.440, val_accuracy=0.891, val_f1_score=0.891]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 62:  89%|████████▉ | 228/255 [01:26<00:10,  2.62it/s, loss=0.0684, v_num=0, train_loss=0.128, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.440, val_accuracy=0.891, val_f1_score=0.891]
Epoch 62:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.0684, v_num=0, train_loss=0.128, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.440, val_accuracy=0.891, val_f1_score=0.891]
Epoch 62:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.0684, v_num=0, train_loss=0.128, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.440, val_accuracy=0.891, val_f1_score=0.891]
Epoch 62:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.0684, v_num=0, train_loss=0.128, train_accu

Epoch 62, global step 14237: val_loss was not in top 2


Epoch 63:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.0726, v_num=0, train_loss=0.0592, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.431, val_accuracy=0.906, val_f1_score=0.906]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 63:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.0726, v_num=0, train_loss=0.0592, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.431, val_accuracy=0.906, val_f1_score=0.906]
Epoch 63:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.0726, v_num=0, train_loss=0.0592, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.431, val_accuracy=0.906, val_f1_score=0.906]
Epoch 63:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.0726, v_num=0, train_loss=0.0592, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.431, val_accuracy=0.906, val_f1_score=0.906]
Epoch 63:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.0726, v_num=0, train_loss=0.0592, train_a

Epoch 63, global step 14463: val_loss was not in top 2


Epoch 64:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0632, v_num=0, train_loss=0.0858, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.429, val_accuracy=0.899, val_f1_score=0.899]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 64:  89%|████████▉ | 228/255 [01:26<00:10,  2.64it/s, loss=0.0632, v_num=0, train_loss=0.0858, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.429, val_accuracy=0.899, val_f1_score=0.899]
Epoch 64:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.0632, v_num=0, train_loss=0.0858, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.429, val_accuracy=0.899, val_f1_score=0.899]
Epoch 64:  91%|█████████ | 232/255 [01:26<00:08,  2.67it/s, loss=0.0632, v_num=0, train_loss=0.0858, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.429, val_accuracy=0.899, val_f1_score=0.899]
Epoch 64:  92%|█████████▏| 234/255 [01:26<00:07,  2.69it/s, loss=0.0632, v_num=0, train_loss=0.0858, train_a

Epoch 64, global step 14689: val_loss was not in top 2


Epoch 65:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.082, v_num=0, train_loss=0.00868, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.343, val_accuracy=0.908, val_f1_score=0.908]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 65:  89%|████████▉ | 228/255 [01:26<00:10,  2.62it/s, loss=0.082, v_num=0, train_loss=0.00868, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.343, val_accuracy=0.908, val_f1_score=0.908]
Epoch 65:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.082, v_num=0, train_loss=0.00868, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.343, val_accuracy=0.908, val_f1_score=0.908]
Epoch 65:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.082, v_num=0, train_loss=0.00868, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.343, val_accuracy=0.908, val_f1_score=0.908]
Epoch 65:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.082, v_num=0, train_loss=0.00868, train_a

Epoch 65, global step 14915: val_loss was not in top 2


Epoch 66:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.0554, v_num=0, train_loss=0.0154, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.353, val_accuracy=0.911, val_f1_score=0.911] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 66:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.0554, v_num=0, train_loss=0.0154, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.353, val_accuracy=0.911, val_f1_score=0.911]
Epoch 66:  90%|█████████ | 230/255 [01:26<00:09,  2.64it/s, loss=0.0554, v_num=0, train_loss=0.0154, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.353, val_accuracy=0.911, val_f1_score=0.911]
Epoch 66:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.0554, v_num=0, train_loss=0.0154, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.353, val_accuracy=0.911, val_f1_score=0.911]
Epoch 66:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.0554, v_num=0, train_loss=0.0154, train_

Epoch 66, global step 15141: val_loss was not in top 2


Epoch 67:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0657, v_num=0, train_loss=0.0228, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.410, val_accuracy=0.910, val_f1_score=0.910]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 67:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.0657, v_num=0, train_loss=0.0228, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.410, val_accuracy=0.910, val_f1_score=0.910]
Epoch 67:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.0657, v_num=0, train_loss=0.0228, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.410, val_accuracy=0.910, val_f1_score=0.910]
Epoch 67:  91%|█████████ | 232/255 [01:26<00:08,  2.67it/s, loss=0.0657, v_num=0, train_loss=0.0228, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.410, val_accuracy=0.910, val_f1_score=0.910]
Epoch 67:  92%|█████████▏| 234/255 [01:27<00:07,  2.69it/s, loss=0.0657, v_num=0, train_loss=0.0228, train_a

Epoch 67, global step 15367: val_loss was not in top 2


Epoch 68:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0768, v_num=0, train_loss=0.0241, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.352, val_accuracy=0.912, val_f1_score=0.912]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 68:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.0768, v_num=0, train_loss=0.0241, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.352, val_accuracy=0.912, val_f1_score=0.912]
Epoch 68:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.0768, v_num=0, train_loss=0.0241, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.352, val_accuracy=0.912, val_f1_score=0.912]
Epoch 68:  91%|█████████ | 232/255 [01:27<00:08,  2.67it/s, loss=0.0768, v_num=0, train_loss=0.0241, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.352, val_accuracy=0.912, val_f1_score=0.912]
Epoch 68:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.0768, v_num=0, train_loss=0.0241, train_a

Epoch 68, global step 15593: val_loss was not in top 2


Epoch 69:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0735, v_num=0, train_loss=0.0224, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.371, val_accuracy=0.901, val_f1_score=0.901] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 69:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.0735, v_num=0, train_loss=0.0224, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.371, val_accuracy=0.901, val_f1_score=0.901]
Epoch 69:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.0735, v_num=0, train_loss=0.0224, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.371, val_accuracy=0.901, val_f1_score=0.901]
Epoch 69:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.0735, v_num=0, train_loss=0.0224, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.371, val_accuracy=0.901, val_f1_score=0.901]
Epoch 69:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.0735, v_num=0, train_loss=0.0224, train_

Epoch 69, global step 15819: val_loss was not in top 2


Epoch 70:  89%|████████▊ | 226/255 [01:19<00:10,  2.83it/s, loss=0.0649, v_num=0, train_loss=0.214, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.388, val_accuracy=0.885, val_f1_score=0.885]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 70:  89%|████████▉ | 228/255 [01:26<00:10,  2.64it/s, loss=0.0649, v_num=0, train_loss=0.214, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.388, val_accuracy=0.885, val_f1_score=0.885]
Epoch 70:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.0649, v_num=0, train_loss=0.214, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.388, val_accuracy=0.885, val_f1_score=0.885]
Epoch 70:  91%|█████████ | 232/255 [01:26<00:08,  2.67it/s, loss=0.0649, v_num=0, train_loss=0.214, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.388, val_accuracy=0.885, val_f1_score=0.885]
Epoch 70:  92%|█████████▏| 234/255 [01:26<00:07,  2.69it/s, loss=0.0649, v_num=0, train_loss=0.214, train_accu

Epoch 70, global step 16045: val_loss was not in top 2


Epoch 71:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0485, v_num=0, train_loss=0.005, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.387, val_accuracy=0.906, val_f1_score=0.906]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 71:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.0485, v_num=0, train_loss=0.005, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.387, val_accuracy=0.906, val_f1_score=0.906]
Epoch 71:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.0485, v_num=0, train_loss=0.005, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.387, val_accuracy=0.906, val_f1_score=0.906]
Epoch 71:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.0485, v_num=0, train_loss=0.005, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.387, val_accuracy=0.906, val_f1_score=0.906]
Epoch 71:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.0485, v_num=0, train_loss=0.005, train_accu

Epoch 71, global step 16271: val_loss was not in top 2


Epoch 72:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.0422, v_num=0, train_loss=0.086, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.419, val_accuracy=0.905, val_f1_score=0.905]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 72:  89%|████████▉ | 228/255 [01:26<00:10,  2.62it/s, loss=0.0422, v_num=0, train_loss=0.086, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.419, val_accuracy=0.905, val_f1_score=0.905]
Epoch 72:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.0422, v_num=0, train_loss=0.086, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.419, val_accuracy=0.905, val_f1_score=0.905]
Epoch 72:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.0422, v_num=0, train_loss=0.086, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.419, val_accuracy=0.905, val_f1_score=0.905]
Epoch 72:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.0422, v_num=0, train_loss=0.086, train_accu

Epoch 72, global step 16497: val_loss was not in top 2


Epoch 73:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0502, v_num=0, train_loss=0.0157, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.379, val_accuracy=0.911, val_f1_score=0.911] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 73:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.0502, v_num=0, train_loss=0.0157, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.379, val_accuracy=0.911, val_f1_score=0.911]
Epoch 73:  90%|█████████ | 230/255 [01:26<00:09,  2.64it/s, loss=0.0502, v_num=0, train_loss=0.0157, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.379, val_accuracy=0.911, val_f1_score=0.911]
Epoch 73:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.0502, v_num=0, train_loss=0.0157, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.379, val_accuracy=0.911, val_f1_score=0.911]
Epoch 73:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.0502, v_num=0, train_loss=0.0157, train_

Epoch 73, global step 16723: val_loss was not in top 2


Epoch 74:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.0472, v_num=0, train_loss=0.0631, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.390, val_accuracy=0.909, val_f1_score=0.909] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 74:  89%|████████▉ | 228/255 [01:26<00:10,  2.62it/s, loss=0.0472, v_num=0, train_loss=0.0631, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.390, val_accuracy=0.909, val_f1_score=0.909]
Epoch 74:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.0472, v_num=0, train_loss=0.0631, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.390, val_accuracy=0.909, val_f1_score=0.909]
Epoch 74:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.0472, v_num=0, train_loss=0.0631, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.390, val_accuracy=0.909, val_f1_score=0.909]
Epoch 74:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.0472, v_num=0, train_loss=0.0631, train_

Epoch 74, global step 16949: val_loss was not in top 2


Epoch 75:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0644, v_num=0, train_loss=0.00374, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.402, val_accuracy=0.913, val_f1_score=0.913]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 75:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.0644, v_num=0, train_loss=0.00374, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.402, val_accuracy=0.913, val_f1_score=0.913]
Epoch 75:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.0644, v_num=0, train_loss=0.00374, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.402, val_accuracy=0.913, val_f1_score=0.913]
Epoch 75:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.0644, v_num=0, train_loss=0.00374, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.402, val_accuracy=0.913, val_f1_score=0.913]
Epoch 75:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.0644, v_num=0, train_loss=0.00374, tr

Epoch 75, global step 17175: val_loss was not in top 2


Epoch 76:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.0375, v_num=0, train_loss=0.0196, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.358, val_accuracy=0.917, val_f1_score=0.917] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 76:  89%|████████▉ | 228/255 [01:27<00:10,  2.62it/s, loss=0.0375, v_num=0, train_loss=0.0196, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.358, val_accuracy=0.917, val_f1_score=0.917]
Epoch 76:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.0375, v_num=0, train_loss=0.0196, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.358, val_accuracy=0.917, val_f1_score=0.917]
Epoch 76:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.0375, v_num=0, train_loss=0.0196, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.358, val_accuracy=0.917, val_f1_score=0.917]
Epoch 76:  92%|█████████▏| 234/255 [01:27<00:07,  2.67it/s, loss=0.0375, v_num=0, train_loss=0.0196, train_

Epoch 76, global step 17401: val_loss was not in top 2


Epoch 77:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.0512, v_num=0, train_loss=0.115, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.411, val_accuracy=0.913, val_f1_score=0.913]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 77:  89%|████████▉ | 228/255 [01:26<00:10,  2.62it/s, loss=0.0512, v_num=0, train_loss=0.115, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.411, val_accuracy=0.913, val_f1_score=0.913]
Epoch 77:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.0512, v_num=0, train_loss=0.115, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.411, val_accuracy=0.913, val_f1_score=0.913]
Epoch 77:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.0512, v_num=0, train_loss=0.115, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.411, val_accuracy=0.913, val_f1_score=0.913]
Epoch 77:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.0512, v_num=0, train_loss=0.115, train_accu

Epoch 77, global step 17627: val_loss was not in top 2


Epoch 78:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.0371, v_num=0, train_loss=0.0406, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.352, val_accuracy=0.916, val_f1_score=0.916] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 78:  89%|████████▉ | 228/255 [01:26<00:10,  2.62it/s, loss=0.0371, v_num=0, train_loss=0.0406, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.352, val_accuracy=0.916, val_f1_score=0.916]
Epoch 78:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.0371, v_num=0, train_loss=0.0406, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.352, val_accuracy=0.916, val_f1_score=0.916]
Epoch 78:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.0371, v_num=0, train_loss=0.0406, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.352, val_accuracy=0.916, val_f1_score=0.916]
Epoch 78:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.0371, v_num=0, train_loss=0.0406, train_

Epoch 78, global step 17853: val_loss was not in top 2


Epoch 79:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0755, v_num=0, train_loss=0.423, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.350, val_accuracy=0.920, val_f1_score=0.920]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 79:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.0755, v_num=0, train_loss=0.423, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.350, val_accuracy=0.920, val_f1_score=0.920]
Epoch 79:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.0755, v_num=0, train_loss=0.423, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.350, val_accuracy=0.920, val_f1_score=0.920]
Epoch 79:  91%|█████████ | 232/255 [01:27<00:08,  2.67it/s, loss=0.0755, v_num=0, train_loss=0.423, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.350, val_accuracy=0.920, val_f1_score=0.920]
Epoch 79:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.0755, v_num=0, train_loss=0.423, train_accu

Epoch 79, global step 18079: val_loss reached 0.32791 (best 0.28694), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3-v1.ckpt" as top 2


Epoch 80:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.0461, v_num=0, train_loss=0.0751, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.328, val_accuracy=0.928, val_f1_score=0.928] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 80:  89%|████████▉ | 228/255 [01:26<00:10,  2.62it/s, loss=0.0461, v_num=0, train_loss=0.0751, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.328, val_accuracy=0.928, val_f1_score=0.928]
Epoch 80:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.0461, v_num=0, train_loss=0.0751, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.328, val_accuracy=0.928, val_f1_score=0.928]
Epoch 80:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.0461, v_num=0, train_loss=0.0751, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.328, val_accuracy=0.928, val_f1_score=0.928]
Epoch 80:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.0461, v_num=0, train_loss=0.0751, train_

Epoch 80, global step 18305: val_loss reached 0.31468 (best 0.28694), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3-v1.ckpt" as top 2


Epoch 81:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0466, v_num=0, train_loss=0.0533, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.315, val_accuracy=0.923, val_f1_score=0.923] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 81:  89%|████████▉ | 228/255 [01:26<00:10,  2.62it/s, loss=0.0466, v_num=0, train_loss=0.0533, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.315, val_accuracy=0.923, val_f1_score=0.923]
Epoch 81:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.0466, v_num=0, train_loss=0.0533, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.315, val_accuracy=0.923, val_f1_score=0.923]
Epoch 81:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.0466, v_num=0, train_loss=0.0533, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.315, val_accuracy=0.923, val_f1_score=0.923]
Epoch 81:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.0466, v_num=0, train_loss=0.0533, train_

Epoch 81, global step 18531: val_loss reached 0.31432 (best 0.28694), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3-v1.ckpt" as top 2


Epoch 82:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0425, v_num=0, train_loss=0.0218, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.314, val_accuracy=0.919, val_f1_score=0.919] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 82:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.0425, v_num=0, train_loss=0.0218, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.314, val_accuracy=0.919, val_f1_score=0.919]
Epoch 82:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.0425, v_num=0, train_loss=0.0218, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.314, val_accuracy=0.919, val_f1_score=0.919]
Epoch 82:  91%|█████████ | 232/255 [01:27<00:08,  2.67it/s, loss=0.0425, v_num=0, train_loss=0.0218, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.314, val_accuracy=0.919, val_f1_score=0.919]
Epoch 82:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.0425, v_num=0, train_loss=0.0218, train_

Epoch 82, global step 18757: val_loss was not in top 2


Epoch 83:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.0521, v_num=0, train_loss=0.00605, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.362, val_accuracy=0.926, val_f1_score=0.926]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 83:  89%|████████▉ | 228/255 [01:26<00:10,  2.62it/s, loss=0.0521, v_num=0, train_loss=0.00605, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.362, val_accuracy=0.926, val_f1_score=0.926]
Epoch 83:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.0521, v_num=0, train_loss=0.00605, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.362, val_accuracy=0.926, val_f1_score=0.926]
Epoch 83:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.0521, v_num=0, train_loss=0.00605, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.362, val_accuracy=0.926, val_f1_score=0.926]
Epoch 83:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.0521, v_num=0, train_loss=0.00605, tr

Epoch 83, global step 18983: val_loss was not in top 2


Epoch 84:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0383, v_num=0, train_loss=0.0363, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.331, val_accuracy=0.921, val_f1_score=0.921] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 84:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.0383, v_num=0, train_loss=0.0363, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.331, val_accuracy=0.921, val_f1_score=0.921]
Epoch 84:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.0383, v_num=0, train_loss=0.0363, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.331, val_accuracy=0.921, val_f1_score=0.921]
Epoch 84:  91%|█████████ | 232/255 [01:27<00:08,  2.67it/s, loss=0.0383, v_num=0, train_loss=0.0363, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.331, val_accuracy=0.921, val_f1_score=0.921]
Epoch 84:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.0383, v_num=0, train_loss=0.0363, train_

Epoch 84, global step 19209: val_loss reached 0.30718 (best 0.28694), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3-v1.ckpt" as top 2


Epoch 85:  89%|████████▊ | 226/255 [01:20<00:10,  2.80it/s, loss=0.0242, v_num=0, train_loss=0.00927, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.307, val_accuracy=0.921, val_f1_score=0.921]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 85:  89%|████████▉ | 228/255 [01:27<00:10,  2.62it/s, loss=0.0242, v_num=0, train_loss=0.00927, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.307, val_accuracy=0.921, val_f1_score=0.921]
Epoch 85:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.0242, v_num=0, train_loss=0.00927, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.307, val_accuracy=0.921, val_f1_score=0.921]
Epoch 85:  91%|█████████ | 232/255 [01:27<00:08,  2.65it/s, loss=0.0242, v_num=0, train_loss=0.00927, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.307, val_accuracy=0.921, val_f1_score=0.921]
Epoch 85:  92%|█████████▏| 234/255 [01:27<00:07,  2.67it/s, loss=0.0242, v_num=0, train_loss=0.00927, tr

Epoch 85, global step 19435: val_loss was not in top 2


Epoch 86:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.0276, v_num=0, train_loss=0.00224, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.362, val_accuracy=0.926, val_f1_score=0.926]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 86:  89%|████████▉ | 228/255 [01:26<00:10,  2.62it/s, loss=0.0276, v_num=0, train_loss=0.00224, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.362, val_accuracy=0.926, val_f1_score=0.926]
Epoch 86:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.0276, v_num=0, train_loss=0.00224, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.362, val_accuracy=0.926, val_f1_score=0.926]
Epoch 86:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.0276, v_num=0, train_loss=0.00224, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.362, val_accuracy=0.926, val_f1_score=0.926]
Epoch 86:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.0276, v_num=0, train_loss=0.00224, tr

Epoch 86, global step 19661: val_loss was not in top 2


Epoch 87:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.0301, v_num=0, train_loss=0.000577, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.336, val_accuracy=0.923, val_f1_score=0.923]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 87:  89%|████████▉ | 228/255 [01:27<00:10,  2.62it/s, loss=0.0301, v_num=0, train_loss=0.000577, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.336, val_accuracy=0.923, val_f1_score=0.923]
Epoch 87:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.0301, v_num=0, train_loss=0.000577, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.336, val_accuracy=0.923, val_f1_score=0.923]
Epoch 87:  91%|█████████ | 232/255 [01:27<00:08,  2.65it/s, loss=0.0301, v_num=0, train_loss=0.000577, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.336, val_accuracy=0.923, val_f1_score=0.923]
Epoch 87:  92%|█████████▏| 234/255 [01:27<00:07,  2.67it/s, loss=0.0301, v_num=0, train_loss=0.00057

Epoch 87, global step 19887: val_loss was not in top 2


Epoch 88:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.0239, v_num=0, train_loss=0.000951, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.346, val_accuracy=0.922, val_f1_score=0.922]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 88:  89%|████████▉ | 228/255 [01:26<00:10,  2.62it/s, loss=0.0239, v_num=0, train_loss=0.000951, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.346, val_accuracy=0.922, val_f1_score=0.922]
Epoch 88:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.0239, v_num=0, train_loss=0.000951, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.346, val_accuracy=0.922, val_f1_score=0.922]
Epoch 88:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.0239, v_num=0, train_loss=0.000951, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.346, val_accuracy=0.922, val_f1_score=0.922]
Epoch 88:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.0239, v_num=0, train_loss=0.00095

Epoch 88, global step 20113: val_loss was not in top 2


Epoch 89:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.0209, v_num=0, train_loss=0.0325, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.371, val_accuracy=0.919, val_f1_score=0.919]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 89:  89%|████████▉ | 228/255 [01:26<00:10,  2.62it/s, loss=0.0209, v_num=0, train_loss=0.0325, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.371, val_accuracy=0.919, val_f1_score=0.919]
Epoch 89:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.0209, v_num=0, train_loss=0.0325, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.371, val_accuracy=0.919, val_f1_score=0.919]
Epoch 89:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.0209, v_num=0, train_loss=0.0325, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.371, val_accuracy=0.919, val_f1_score=0.919]
Epoch 89:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.0209, v_num=0, train_loss=0.0325, train

Epoch 89, global step 20339: val_loss was not in top 2


Epoch 90:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.0298, v_num=0, train_loss=0.0358, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.383, val_accuracy=0.924, val_f1_score=0.924] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 90:  89%|████████▉ | 228/255 [01:27<00:10,  2.62it/s, loss=0.0298, v_num=0, train_loss=0.0358, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.383, val_accuracy=0.924, val_f1_score=0.924]
Epoch 90:  90%|█████████ | 230/255 [01:27<00:09,  2.63it/s, loss=0.0298, v_num=0, train_loss=0.0358, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.383, val_accuracy=0.924, val_f1_score=0.924]
Epoch 90:  91%|█████████ | 232/255 [01:27<00:08,  2.65it/s, loss=0.0298, v_num=0, train_loss=0.0358, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.383, val_accuracy=0.924, val_f1_score=0.924]
Epoch 90:  92%|█████████▏| 234/255 [01:27<00:07,  2.67it/s, loss=0.0298, v_num=0, train_loss=0.0358, train_

Epoch 90, global step 20565: val_loss was not in top 2


Epoch 91:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.0238, v_num=0, train_loss=0.0239, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.312, val_accuracy=0.923, val_f1_score=0.923] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 91:  89%|████████▉ | 228/255 [01:26<00:10,  2.62it/s, loss=0.0238, v_num=0, train_loss=0.0239, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.312, val_accuracy=0.923, val_f1_score=0.923]
Epoch 91:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.0238, v_num=0, train_loss=0.0239, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.312, val_accuracy=0.923, val_f1_score=0.923]
Epoch 91:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.0238, v_num=0, train_loss=0.0239, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.312, val_accuracy=0.923, val_f1_score=0.923]
Epoch 91:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.0238, v_num=0, train_loss=0.0239, train_

Epoch 91, global step 20791: val_loss was not in top 2


Epoch 92:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.036, v_num=0, train_loss=0.0223, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.315, val_accuracy=0.922, val_f1_score=0.922]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 92:  89%|████████▉ | 228/255 [01:27<00:10,  2.62it/s, loss=0.036, v_num=0, train_loss=0.0223, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.315, val_accuracy=0.922, val_f1_score=0.922]
Epoch 92:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.036, v_num=0, train_loss=0.0223, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.315, val_accuracy=0.922, val_f1_score=0.922]
Epoch 92:  91%|█████████ | 232/255 [01:27<00:08,  2.65it/s, loss=0.036, v_num=0, train_loss=0.0223, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.315, val_accuracy=0.922, val_f1_score=0.922]
Epoch 92:  92%|█████████▏| 234/255 [01:27<00:07,  2.67it/s, loss=0.036, v_num=0, train_loss=0.0223, train_accu

Epoch 92, global step 21017: val_loss was not in top 2


Epoch 93:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0201, v_num=0, train_loss=0.00534, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.331, val_accuracy=0.929, val_f1_score=0.929] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 93:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.0201, v_num=0, train_loss=0.00534, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.331, val_accuracy=0.929, val_f1_score=0.929]
Epoch 93:  90%|█████████ | 230/255 [01:26<00:09,  2.65it/s, loss=0.0201, v_num=0, train_loss=0.00534, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.331, val_accuracy=0.929, val_f1_score=0.929]
Epoch 93:  91%|█████████ | 232/255 [01:26<00:08,  2.67it/s, loss=0.0201, v_num=0, train_loss=0.00534, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.331, val_accuracy=0.929, val_f1_score=0.929]
Epoch 93:  92%|█████████▏| 234/255 [01:27<00:07,  2.69it/s, loss=0.0201, v_num=0, train_loss=0.00534, t

Epoch 93, global step 21243: val_loss was not in top 2


Epoch 94:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.0442, v_num=0, train_loss=0.152, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.356, val_accuracy=0.926, val_f1_score=0.926]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 94:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.0442, v_num=0, train_loss=0.152, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.356, val_accuracy=0.926, val_f1_score=0.926]
Epoch 94:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.0442, v_num=0, train_loss=0.152, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.356, val_accuracy=0.926, val_f1_score=0.926]
Epoch 94:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.0442, v_num=0, train_loss=0.152, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.356, val_accuracy=0.926, val_f1_score=0.926]
Epoch 94:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.0442, v_num=0, train_loss=0.152, train_accu

Epoch 94, global step 21469: val_loss was not in top 2


Epoch 95:  89%|████████▊ | 226/255 [01:20<00:10,  2.80it/s, loss=0.028, v_num=0, train_loss=0.00776, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.355, val_accuracy=0.923, val_f1_score=0.923]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 95:  89%|████████▉ | 228/255 [01:27<00:10,  2.62it/s, loss=0.028, v_num=0, train_loss=0.00776, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.355, val_accuracy=0.923, val_f1_score=0.923]
Epoch 95:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.028, v_num=0, train_loss=0.00776, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.355, val_accuracy=0.923, val_f1_score=0.923]
Epoch 95:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.028, v_num=0, train_loss=0.00776, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.355, val_accuracy=0.923, val_f1_score=0.923]
Epoch 95:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.028, v_num=0, train_loss=0.00776, train

Epoch 95, global step 21695: val_loss was not in top 2


Epoch 96:  89%|████████▊ | 226/255 [01:20<00:10,  2.80it/s, loss=0.019, v_num=0, train_loss=0.00769, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.358, val_accuracy=0.919, val_f1_score=0.919]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 96:  89%|████████▉ | 228/255 [01:27<00:10,  2.62it/s, loss=0.019, v_num=0, train_loss=0.00769, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.358, val_accuracy=0.919, val_f1_score=0.919]
Validating:   7%|▋         | 2/29 [00:06<01:16,  2.82s/it][A
Epoch 96:  90%|█████████ | 230/255 [01:27<00:09,  2.62it/s, loss=0.019, v_num=0, train_loss=0.00769, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.358, val_accuracy=0.919, val_f1_score=0.919]
Validating:  14%|█▍        | 4/29 [00:07<00:26,  1.07s/it][A
Epoch 96:  91%|█████████ | 232/255 [01:27<00:08,  2.64it/s, loss=0.019, v_num=0, train_loss=0.00769, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.358, val_accuracy=0.919, va

Epoch 96, global step 21921: val_loss reached 0.28521 (best 0.28521), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3-v1.ckpt" as top 2


Epoch 97:  89%|████████▊ | 226/255 [02:24<00:18,  1.56it/s, loss=0.0271, v_num=0, train_loss=0.000435, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.285, val_accuracy=0.932, val_f1_score=0.932]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 97:  89%|████████▉ | 228/255 [02:31<00:17,  1.51it/s, loss=0.0271, v_num=0, train_loss=0.000435, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.285, val_accuracy=0.932, val_f1_score=0.932]
Validating:   7%|▋         | 2/29 [00:06<01:15,  2.79s/it][A
Epoch 97:  90%|█████████ | 230/255 [02:31<00:16,  1.51it/s, loss=0.0271, v_num=0, train_loss=0.000435, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.285, val_accuracy=0.932, val_f1_score=0.932]
Validating:  14%|█▍        | 4/29 [00:07<00:26,  1.05s/it][A
Epoch 97:  91%|█████████ | 232/255 [02:32<00:15,  1.52it/s, loss=0.0271, v_num=0, train_loss=0.000435, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.285, val_accuracy=0.9

Epoch 97, global step 22147: val_loss was not in top 2


Epoch 98:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.0417, v_num=0, train_loss=0.0167, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.448, val_accuracy=0.916, val_f1_score=0.916]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 98:  89%|████████▉ | 228/255 [02:32<00:18,  1.49it/s, loss=0.0417, v_num=0, train_loss=0.0167, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.448, val_accuracy=0.916, val_f1_score=0.916]
Validating:   7%|▋         | 2/29 [00:06<01:14,  2.76s/it][A
Epoch 98:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.0417, v_num=0, train_loss=0.0167, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.448, val_accuracy=0.916, val_f1_score=0.916]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.03s/it][A
Epoch 98:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.0417, v_num=0, train_loss=0.0167, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.448, val_accuracy=0.916, va

Epoch 98, global step 22373: val_loss was not in top 2


Epoch 99:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.0417, v_num=0, train_loss=0.0024, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.328, val_accuracy=0.916, val_f1_score=0.916] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 99:  89%|████████▉ | 228/255 [02:33<00:18,  1.49it/s, loss=0.0417, v_num=0, train_loss=0.0024, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.328, val_accuracy=0.916, val_f1_score=0.916]
Validating:   7%|▋         | 2/29 [00:06<01:12,  2.68s/it][A
Epoch 99:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.0417, v_num=0, train_loss=0.0024, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.328, val_accuracy=0.916, val_f1_score=0.916]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.04s/it][A
Epoch 99:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.0417, v_num=0, train_loss=0.0024, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.328, val_accuracy=0.916, val

Epoch 99, global step 22599: val_loss was not in top 2


Epoch 100:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.0192, v_num=0, train_loss=0.0108, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.363, val_accuracy=0.916, val_f1_score=0.916] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 100:  89%|████████▉ | 228/255 [02:32<00:18,  1.49it/s, loss=0.0192, v_num=0, train_loss=0.0108, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.363, val_accuracy=0.916, val_f1_score=0.916]
Validating:   7%|▋         | 2/29 [00:06<01:15,  2.80s/it][A
Epoch 100:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.0192, v_num=0, train_loss=0.0108, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.363, val_accuracy=0.916, val_f1_score=0.916]
Validating:  14%|█▍        | 4/29 [00:07<00:26,  1.06s/it][A
Epoch 100:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.0192, v_num=0, train_loss=0.0108, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.363, val_accuracy=0.916,

Epoch 100, global step 22825: val_loss was not in top 2


Epoch 101:  89%|████████▊ | 226/255 [02:26<00:18,  1.55it/s, loss=0.0858, v_num=0, train_loss=0.117, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.303, val_accuracy=0.928, val_f1_score=0.928]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 101:  89%|████████▉ | 228/255 [02:32<00:18,  1.49it/s, loss=0.0858, v_num=0, train_loss=0.117, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.303, val_accuracy=0.928, val_f1_score=0.928]
Validating:   7%|▋         | 2/29 [00:06<01:14,  2.78s/it][A
Epoch 101:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.0858, v_num=0, train_loss=0.117, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.303, val_accuracy=0.928, val_f1_score=0.928]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.01s/it][A
Epoch 101:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.0858, v_num=0, train_loss=0.117, train_accuracy=0.944, train_f1_score=0.944, val_loss=0.303, val_accuracy=0.928, va

Epoch 101, global step 23051: val_loss was not in top 2


Epoch 102:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.0424, v_num=0, train_loss=0.0285, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.359, val_accuracy=0.910, val_f1_score=0.910] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 102:  89%|████████▉ | 228/255 [02:33<00:18,  1.49it/s, loss=0.0424, v_num=0, train_loss=0.0285, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.359, val_accuracy=0.910, val_f1_score=0.910]
Validating:   7%|▋         | 2/29 [00:06<01:15,  2.81s/it][A
Epoch 102:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.0424, v_num=0, train_loss=0.0285, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.359, val_accuracy=0.910, val_f1_score=0.910]
Validating:  14%|█▍        | 4/29 [00:07<00:25,  1.02s/it][A
Epoch 102:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.0424, v_num=0, train_loss=0.0285, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.359, val_accuracy=0.910,

Epoch 102, global step 23277: val_loss reached 0.26176 (best 0.26176), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3.ckpt" as top 2


Epoch 103:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.0242, v_num=0, train_loss=0.00547, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.262, val_accuracy=0.930, val_f1_score=0.930]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 103:  89%|████████▉ | 228/255 [02:33<00:18,  1.49it/s, loss=0.0242, v_num=0, train_loss=0.00547, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.262, val_accuracy=0.930, val_f1_score=0.930]
Validating:   7%|▋         | 2/29 [00:06<01:15,  2.80s/it][A
Epoch 103:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.0242, v_num=0, train_loss=0.00547, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.262, val_accuracy=0.930, val_f1_score=0.930]
Validating:  14%|█▍        | 4/29 [00:07<00:25,  1.02s/it][A
Epoch 103:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.0242, v_num=0, train_loss=0.00547, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.262, val_accuracy=0.9

Epoch 103, global step 23503: val_loss was not in top 2


Epoch 104:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.00494, v_num=0, train_loss=0.00109, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.357, val_accuracy=0.920, val_f1_score=0.920] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 104:  89%|████████▉ | 228/255 [02:33<00:18,  1.49it/s, loss=0.00494, v_num=0, train_loss=0.00109, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.357, val_accuracy=0.920, val_f1_score=0.920]
Validating:   7%|▋         | 2/29 [00:06<01:15,  2.78s/it][A
Epoch 104:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.00494, v_num=0, train_loss=0.00109, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.357, val_accuracy=0.920, val_f1_score=0.920]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.01s/it][A
Epoch 104:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.00494, v_num=0, train_loss=0.00109, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.357, val_accurac

Epoch 104, global step 23729: val_loss was not in top 2


Epoch 105:  89%|████████▊ | 226/255 [02:33<00:19,  1.48it/s, loss=0.0189, v_num=0, train_loss=0.0412, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.298, val_accuracy=0.935, val_f1_score=0.935]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 105:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.0189, v_num=0, train_loss=0.0412, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.298, val_accuracy=0.935, val_f1_score=0.935]
Epoch 105:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.0189, v_num=0, train_loss=0.0412, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.298, val_accuracy=0.935, val_f1_score=0.935]
Epoch 105:  91%|█████████ | 232/255 [02:39<00:15,  1.45it/s, loss=0.0189, v_num=0, train_loss=0.0412, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.298, val_accuracy=0.935, val_f1_score=0.935]
Epoch 105:  92%|█████████▏| 234/255 [02:39<00:14,  1.46it/s, loss=0.0189, v_num=0, train_loss=0.0412,

Epoch 105, global step 23955: val_loss was not in top 2


Epoch 106:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.0239, v_num=0, train_loss=0.0147, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.362, val_accuracy=0.925, val_f1_score=0.925] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 106:  89%|████████▉ | 228/255 [02:33<00:18,  1.49it/s, loss=0.0239, v_num=0, train_loss=0.0147, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.362, val_accuracy=0.925, val_f1_score=0.925]
Validating:   7%|▋         | 2/29 [00:06<01:14,  2.78s/it][A
Epoch 106:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.0239, v_num=0, train_loss=0.0147, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.362, val_accuracy=0.925, val_f1_score=0.925]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.01s/it][A
Epoch 106:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.0239, v_num=0, train_loss=0.0147, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.362, val_accuracy=0.925,

Epoch 106, global step 24181: val_loss was not in top 2


Epoch 107:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.0151, v_num=0, train_loss=0.00247, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.329, val_accuracy=0.927, val_f1_score=0.927] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 107:  89%|████████▉ | 228/255 [02:32<00:18,  1.49it/s, loss=0.0151, v_num=0, train_loss=0.00247, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.329, val_accuracy=0.927, val_f1_score=0.927]
Validating:   7%|▋         | 2/29 [00:06<01:15,  2.78s/it][A
Epoch 107:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.0151, v_num=0, train_loss=0.00247, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.329, val_accuracy=0.927, val_f1_score=0.927]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.01s/it][A
Epoch 107:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.0151, v_num=0, train_loss=0.00247, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.329, val_accuracy=0.

Epoch 107, global step 24407: val_loss was not in top 2


Epoch 108:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.0206, v_num=0, train_loss=0.00168, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.346, val_accuracy=0.928, val_f1_score=0.928]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 108:  89%|████████▉ | 228/255 [02:33<00:18,  1.49it/s, loss=0.0206, v_num=0, train_loss=0.00168, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.346, val_accuracy=0.928, val_f1_score=0.928]
Validating:   7%|▋         | 2/29 [00:06<01:14,  2.78s/it][A
Epoch 108:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.0206, v_num=0, train_loss=0.00168, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.346, val_accuracy=0.928, val_f1_score=0.928]
Epoch 108:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.0206, v_num=0, train_loss=0.00168, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.346, val_accuracy=0.928, val_f1_score=0.928]
Validating:  21%|██        | 6/29 [0

Epoch 108, global step 24633: val_loss was not in top 2


Epoch 109:  89%|████████▊ | 226/255 [02:25<00:18,  1.55it/s, loss=0.0341, v_num=0, train_loss=0.00441, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.288, val_accuracy=0.929, val_f1_score=0.929] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 109:  89%|████████▉ | 228/255 [02:32<00:18,  1.50it/s, loss=0.0341, v_num=0, train_loss=0.00441, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.288, val_accuracy=0.929, val_f1_score=0.929]
Validating:   7%|▋         | 2/29 [00:06<01:15,  2.80s/it][A
Epoch 109:  90%|█████████ | 230/255 [02:32<00:16,  1.51it/s, loss=0.0341, v_num=0, train_loss=0.00441, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.288, val_accuracy=0.929, val_f1_score=0.929]
Validating:  14%|█▍        | 4/29 [00:07<00:26,  1.06s/it][A
Epoch 109:  91%|█████████ | 232/255 [02:33<00:15,  1.52it/s, loss=0.0341, v_num=0, train_loss=0.00441, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.288, val_accuracy=0.

Epoch 109, global step 24859: val_loss was not in top 2


Epoch 110:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.0138, v_num=0, train_loss=0.0009, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.316, val_accuracy=0.925, val_f1_score=0.925]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 110:  89%|████████▉ | 228/255 [02:33<00:18,  1.49it/s, loss=0.0138, v_num=0, train_loss=0.0009, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.316, val_accuracy=0.925, val_f1_score=0.925]
Validating:   7%|▋         | 2/29 [00:06<01:16,  2.83s/it][A
Epoch 110:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.0138, v_num=0, train_loss=0.0009, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.316, val_accuracy=0.925, val_f1_score=0.925]
Validating:  14%|█▍        | 4/29 [00:07<00:26,  1.07s/it][A
Epoch 110:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.0138, v_num=0, train_loss=0.0009, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.316, val_accuracy=0.92

Epoch 110, global step 25085: val_loss was not in top 2


Epoch 111:  89%|████████▊ | 226/255 [02:26<00:18,  1.55it/s, loss=0.0361, v_num=0, train_loss=0.0133, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.360, val_accuracy=0.928, val_f1_score=0.928] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 111:  89%|████████▉ | 228/255 [02:32<00:18,  1.49it/s, loss=0.0361, v_num=0, train_loss=0.0133, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.360, val_accuracy=0.928, val_f1_score=0.928]
Validating:   7%|▋         | 2/29 [00:06<01:15,  2.79s/it][A
Epoch 111:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.0361, v_num=0, train_loss=0.0133, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.360, val_accuracy=0.928, val_f1_score=0.928]
Validating:  14%|█▍        | 4/29 [00:07<00:26,  1.07s/it][A
Epoch 111:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.0361, v_num=0, train_loss=0.0133, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.360, val_accuracy=0.928,

Epoch 111, global step 25311: val_loss reached 0.27515 (best 0.26176), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3-v1.ckpt" as top 2


Epoch 112:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.0377, v_num=0, train_loss=0.00754, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.275, val_accuracy=0.924, val_f1_score=0.924] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 112:  89%|████████▉ | 228/255 [02:33<00:18,  1.49it/s, loss=0.0377, v_num=0, train_loss=0.00754, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.275, val_accuracy=0.924, val_f1_score=0.924]
Validating:   7%|▋         | 2/29 [00:06<01:15,  2.80s/it][A
Epoch 112:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.0377, v_num=0, train_loss=0.00754, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.275, val_accuracy=0.924, val_f1_score=0.924]
Epoch 112:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.0377, v_num=0, train_loss=0.00754, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.275, val_accuracy=0.924, val_f1_score=0.924]
Validating:  21%|██        | 6/29 [00

Epoch 112, global step 25537: val_loss was not in top 2


Epoch 113:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.0247, v_num=0, train_loss=0.0028, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.313, val_accuracy=0.931, val_f1_score=0.931]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 113:  89%|████████▉ | 228/255 [02:32<00:18,  1.49it/s, loss=0.0247, v_num=0, train_loss=0.0028, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.313, val_accuracy=0.931, val_f1_score=0.931]
Validating:   7%|▋         | 2/29 [00:06<01:14,  2.77s/it][A
Epoch 113:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.0247, v_num=0, train_loss=0.0028, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.313, val_accuracy=0.931, val_f1_score=0.931]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.01s/it][A
Epoch 113:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.0247, v_num=0, train_loss=0.0028, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.313, val_accuracy=0.931

Epoch 113, global step 25763: val_loss was not in top 2


Epoch 114:  89%|████████▊ | 226/255 [02:28<00:19,  1.52it/s, loss=0.0404, v_num=0, train_loss=0.00306, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.923, val_f1_score=0.923]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 114:  89%|████████▉ | 228/255 [02:35<00:18,  1.47it/s, loss=0.0404, v_num=0, train_loss=0.00306, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.923, val_f1_score=0.923]
Epoch 114:  90%|█████████ | 230/255 [02:35<00:16,  1.48it/s, loss=0.0404, v_num=0, train_loss=0.00306, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.923, val_f1_score=0.923]
Epoch 114:  91%|█████████ | 232/255 [02:35<00:15,  1.49it/s, loss=0.0404, v_num=0, train_loss=0.00306, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.923, val_f1_score=0.923]
Epoch 114:  92%|█████████▏| 234/255 [02:35<00:13,  1.50it/s, loss=0.0404, v_num=0, train_loss=0.00

Epoch 114, global step 25989: val_loss was not in top 2


Epoch 115:  89%|████████▊ | 226/255 [02:31<00:19,  1.49it/s, loss=0.00559, v_num=0, train_loss=0.00142, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.335, val_accuracy=0.933, val_f1_score=0.933] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 115:  89%|████████▉ | 228/255 [02:38<00:18,  1.44it/s, loss=0.00559, v_num=0, train_loss=0.00142, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.335, val_accuracy=0.933, val_f1_score=0.933]
Validating:   7%|▋         | 2/29 [00:07<01:19,  2.94s/it][A
Epoch 115:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.00559, v_num=0, train_loss=0.00142, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.335, val_accuracy=0.933, val_f1_score=0.933]
Validating:  14%|█▍        | 4/29 [00:07<00:26,  1.07s/it][A
Epoch 115:  91%|█████████ | 232/255 [02:39<00:15,  1.46it/s, loss=0.00559, v_num=0, train_loss=0.00142, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.335, val_accurac

Epoch 115, global step 26215: val_loss was not in top 2


Epoch 116:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.0124, v_num=0, train_loss=0.0016, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.351, val_accuracy=0.930, val_f1_score=0.930]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 116:  89%|████████▉ | 228/255 [02:33<00:18,  1.49it/s, loss=0.0124, v_num=0, train_loss=0.0016, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.351, val_accuracy=0.930, val_f1_score=0.930]
Validating:   7%|▋         | 2/29 [00:06<01:15,  2.78s/it][A
Epoch 116:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.0124, v_num=0, train_loss=0.0016, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.351, val_accuracy=0.930, val_f1_score=0.930]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.01s/it][A
Epoch 116:  91%|█████████ | 232/255 [02:34<00:15,  1.51it/s, loss=0.0124, v_num=0, train_loss=0.0016, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.351, val_accuracy=0.93

Epoch 116, global step 26441: val_loss was not in top 2


Epoch 117:  89%|████████▊ | 226/255 [02:27<00:18,  1.54it/s, loss=0.0125, v_num=0, train_loss=0.0081, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.333, val_accuracy=0.938, val_f1_score=0.938]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 117:  89%|████████▉ | 228/255 [02:33<00:18,  1.48it/s, loss=0.0125, v_num=0, train_loss=0.0081, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.333, val_accuracy=0.938, val_f1_score=0.938]
Validating:   7%|▋         | 2/29 [00:06<01:16,  2.84s/it][A
Epoch 117:  90%|█████████ | 230/255 [02:34<00:16,  1.49it/s, loss=0.0125, v_num=0, train_loss=0.0081, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.333, val_accuracy=0.938, val_f1_score=0.938]
Validating:  14%|█▍        | 4/29 [00:07<00:26,  1.04s/it][A
Epoch 117:  91%|█████████ | 232/255 [02:34<00:15,  1.50it/s, loss=0.0125, v_num=0, train_loss=0.0081, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.333, val_accuracy=0.938

Epoch 117, global step 26667: val_loss was not in top 2


Epoch 118:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.00448, v_num=0, train_loss=0.00675, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.302, val_accuracy=0.930, val_f1_score=0.930] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 118:  89%|████████▉ | 228/255 [02:32<00:18,  1.49it/s, loss=0.00448, v_num=0, train_loss=0.00675, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.302, val_accuracy=0.930, val_f1_score=0.930]
Validating:   7%|▋         | 2/29 [00:06<01:14,  2.77s/it][A
Epoch 118:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.00448, v_num=0, train_loss=0.00675, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.302, val_accuracy=0.930, val_f1_score=0.930]
Validating:  14%|█▍        | 4/29 [00:07<00:26,  1.05s/it][A
Epoch 118:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.00448, v_num=0, train_loss=0.00675, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.302, val_accurac

Epoch 118, global step 26893: val_loss was not in top 2


Epoch 119:  89%|████████▊ | 226/255 [02:26<00:18,  1.55it/s, loss=0.0144, v_num=0, train_loss=0.00145, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.331, val_accuracy=0.934, val_f1_score=0.934]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 119:  89%|████████▉ | 228/255 [02:32<00:18,  1.50it/s, loss=0.0144, v_num=0, train_loss=0.00145, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.331, val_accuracy=0.934, val_f1_score=0.934]
Validating:   7%|▋         | 2/29 [00:06<01:14,  2.78s/it][A
Epoch 119:  90%|█████████ | 230/255 [02:32<00:16,  1.50it/s, loss=0.0144, v_num=0, train_loss=0.00145, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.331, val_accuracy=0.934, val_f1_score=0.934]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.01s/it][A
Epoch 119:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.0144, v_num=0, train_loss=0.00145, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.331, val_accuracy=0

Epoch 119, global step 27119: val_loss was not in top 2


Epoch 120:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.0179, v_num=0, train_loss=0.00661, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.324, val_accuracy=0.937, val_f1_score=0.937]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 120:  89%|████████▉ | 228/255 [02:32<00:18,  1.49it/s, loss=0.0179, v_num=0, train_loss=0.00661, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.324, val_accuracy=0.937, val_f1_score=0.937]
Validating:   7%|▋         | 2/29 [00:06<01:15,  2.78s/it][A
Epoch 120:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.0179, v_num=0, train_loss=0.00661, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.324, val_accuracy=0.937, val_f1_score=0.937]
Validating:  14%|█▍        | 4/29 [00:07<00:26,  1.06s/it][A
Epoch 120:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.0179, v_num=0, train_loss=0.00661, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.324, val_accuracy=0

Epoch 120, global step 27345: val_loss was not in top 2


Epoch 121:  89%|████████▊ | 226/255 [02:26<00:18,  1.55it/s, loss=0.0174, v_num=0, train_loss=0.00306, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.338, val_accuracy=0.928, val_f1_score=0.928]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 121:  89%|████████▉ | 228/255 [02:32<00:18,  1.49it/s, loss=0.0174, v_num=0, train_loss=0.00306, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.338, val_accuracy=0.928, val_f1_score=0.928]
Validating:   7%|▋         | 2/29 [00:06<01:17,  2.86s/it][A
Epoch 121:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.0174, v_num=0, train_loss=0.00306, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.338, val_accuracy=0.928, val_f1_score=0.928]
Validating:  14%|█▍        | 4/29 [00:07<00:26,  1.04s/it][A
Epoch 121:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.0174, v_num=0, train_loss=0.00306, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.338, val_accuracy=0

Epoch 121, global step 27571: val_loss reached 0.27450 (best 0.26176), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3-v1.ckpt" as top 2


Epoch 122:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.00709, v_num=0, train_loss=0.00831, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.275, val_accuracy=0.938, val_f1_score=0.938] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 122:  89%|████████▉ | 228/255 [02:33<00:18,  1.49it/s, loss=0.00709, v_num=0, train_loss=0.00831, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.275, val_accuracy=0.938, val_f1_score=0.938]
Validating:   7%|▋         | 2/29 [00:06<01:16,  2.85s/it][A
Epoch 122:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.00709, v_num=0, train_loss=0.00831, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.275, val_accuracy=0.938, val_f1_score=0.938]
Validating:  14%|█▍        | 4/29 [00:07<00:25,  1.04s/it][A
Epoch 122:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.00709, v_num=0, train_loss=0.00831, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.275, val_accurac

Epoch 122, global step 27797: val_loss was not in top 2


Epoch 123:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.00569, v_num=0, train_loss=0.00093, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.314, val_accuracy=0.938, val_f1_score=0.938] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 123:  89%|████████▉ | 228/255 [02:33<00:18,  1.49it/s, loss=0.00569, v_num=0, train_loss=0.00093, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.314, val_accuracy=0.938, val_f1_score=0.938]
Validating:   7%|▋         | 2/29 [00:06<01:17,  2.86s/it][A
Epoch 123:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.00569, v_num=0, train_loss=0.00093, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.314, val_accuracy=0.938, val_f1_score=0.938]
Validating:  14%|█▍        | 4/29 [00:07<00:26,  1.05s/it][A
Epoch 123:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.00569, v_num=0, train_loss=0.00093, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.314, val_accurac

Epoch 123, global step 28023: val_loss was not in top 2


Epoch 124:  89%|████████▊ | 226/255 [02:31<00:19,  1.49it/s, loss=0.0121, v_num=0, train_loss=0.000308, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.343, val_accuracy=0.933, val_f1_score=0.933] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 124:  89%|████████▉ | 228/255 [02:38<00:18,  1.44it/s, loss=0.0121, v_num=0, train_loss=0.000308, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.343, val_accuracy=0.933, val_f1_score=0.933]
Epoch 124:  90%|█████████ | 230/255 [02:38<00:17,  1.45it/s, loss=0.0121, v_num=0, train_loss=0.000308, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.343, val_accuracy=0.933, val_f1_score=0.933]
Epoch 124:  91%|█████████ | 232/255 [02:38<00:15,  1.46it/s, loss=0.0121, v_num=0, train_loss=0.000308, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.343, val_accuracy=0.933, val_f1_score=0.933]
Epoch 124:  92%|█████████▏| 234/255 [02:38<00:14,  1.47it/s, loss=0.0121, v_num=0, train_loss=0

Epoch 124, global step 28249: val_loss was not in top 2


Epoch 125:  89%|████████▊ | 226/255 [02:28<00:19,  1.52it/s, loss=0.0106, v_num=0, train_loss=0.00126, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.325, val_accuracy=0.934, val_f1_score=0.934]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 125:  89%|████████▉ | 228/255 [02:35<00:18,  1.47it/s, loss=0.0106, v_num=0, train_loss=0.00126, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.325, val_accuracy=0.934, val_f1_score=0.934]
Validating:   7%|▋         | 2/29 [00:06<01:17,  2.86s/it][A
Epoch 125:  90%|█████████ | 230/255 [02:35<00:16,  1.48it/s, loss=0.0106, v_num=0, train_loss=0.00126, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.325, val_accuracy=0.934, val_f1_score=0.934]
Validating:  14%|█▍        | 4/29 [00:07<00:27,  1.08s/it][A
Epoch 125:  91%|█████████ | 232/255 [02:36<00:15,  1.49it/s, loss=0.0106, v_num=0, train_loss=0.00126, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.325, val_accuracy=0

Epoch 125, global step 28475: val_loss was not in top 2


Epoch 126:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.0246, v_num=0, train_loss=0.000679, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.347, val_accuracy=0.935, val_f1_score=0.935] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 126:  89%|████████▉ | 228/255 [02:32<00:18,  1.49it/s, loss=0.0246, v_num=0, train_loss=0.000679, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.347, val_accuracy=0.935, val_f1_score=0.935]
Validating:   7%|▋         | 2/29 [00:06<01:15,  2.78s/it][A
Epoch 126:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.0246, v_num=0, train_loss=0.000679, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.347, val_accuracy=0.935, val_f1_score=0.935]
Epoch 126:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.0246, v_num=0, train_loss=0.000679, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.347, val_accuracy=0.935, val_f1_score=0.935]
Validating:  21%|██        | 6/29

Epoch 126, global step 28701: val_loss was not in top 2


Epoch 127:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.0148, v_num=0, train_loss=0.00311, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.327, val_accuracy=0.933, val_f1_score=0.933]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 127:  89%|████████▉ | 228/255 [02:33<00:18,  1.48it/s, loss=0.0148, v_num=0, train_loss=0.00311, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.327, val_accuracy=0.933, val_f1_score=0.933]
Validating:   7%|▋         | 2/29 [00:06<01:16,  2.83s/it][A
Epoch 127:  90%|█████████ | 230/255 [02:34<00:16,  1.49it/s, loss=0.0148, v_num=0, train_loss=0.00311, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.327, val_accuracy=0.933, val_f1_score=0.933]
Validating:  14%|█▍        | 4/29 [00:07<00:26,  1.04s/it][A
Epoch 127:  91%|█████████ | 232/255 [02:34<00:15,  1.50it/s, loss=0.0148, v_num=0, train_loss=0.00311, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.327, val_accuracy=0

Epoch 127, global step 28927: val_loss was not in top 2


Epoch 128:  89%|████████▊ | 226/255 [02:26<00:18,  1.55it/s, loss=0.00771, v_num=0, train_loss=0.000127, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.327, val_accuracy=0.938, val_f1_score=0.938]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 128:  89%|████████▉ | 228/255 [02:32<00:18,  1.49it/s, loss=0.00771, v_num=0, train_loss=0.000127, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.327, val_accuracy=0.938, val_f1_score=0.938]
Validating:   7%|▋         | 2/29 [00:06<01:16,  2.83s/it][A
Epoch 128:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.00771, v_num=0, train_loss=0.000127, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.327, val_accuracy=0.938, val_f1_score=0.938]
Validating:  14%|█▍        | 4/29 [00:07<00:26,  1.08s/it][A
Epoch 128:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.00771, v_num=0, train_loss=0.000127, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.327, val_accu

Epoch 128, global step 29153: val_loss was not in top 2


Epoch 129:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.0224, v_num=0, train_loss=0.000185, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.340, val_accuracy=0.943, val_f1_score=0.943] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 129:  89%|████████▉ | 228/255 [02:32<00:18,  1.49it/s, loss=0.0224, v_num=0, train_loss=0.000185, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.340, val_accuracy=0.943, val_f1_score=0.943]
Validating:   7%|▋         | 2/29 [00:06<01:15,  2.81s/it][A
Epoch 129:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.0224, v_num=0, train_loss=0.000185, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.340, val_accuracy=0.943, val_f1_score=0.943]
Validating:  14%|█▍        | 4/29 [00:07<00:26,  1.07s/it][A
Epoch 129:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.0224, v_num=0, train_loss=0.000185, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.340, val_accurac

Epoch 129, global step 29379: val_loss was not in top 2


Epoch 130:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.0222, v_num=0, train_loss=0.0102, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.349, val_accuracy=0.938, val_f1_score=0.938]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 130:  89%|████████▉ | 228/255 [02:33<00:18,  1.49it/s, loss=0.0222, v_num=0, train_loss=0.0102, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.349, val_accuracy=0.938, val_f1_score=0.938]
Validating:   7%|▋         | 2/29 [00:06<01:16,  2.85s/it][A
Epoch 130:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.0222, v_num=0, train_loss=0.0102, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.349, val_accuracy=0.938, val_f1_score=0.938]
Validating:  14%|█▍        | 4/29 [00:07<00:26,  1.07s/it][A
Epoch 130:  91%|█████████ | 232/255 [02:34<00:15,  1.51it/s, loss=0.0222, v_num=0, train_loss=0.0102, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.349, val_accuracy=0.93

Epoch 130, global step 29605: val_loss was not in top 2


Epoch 131:  89%|████████▊ | 226/255 [02:26<00:18,  1.55it/s, loss=0.0144, v_num=0, train_loss=0.000719, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.318, val_accuracy=0.930, val_f1_score=0.930] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 131:  89%|████████▉ | 228/255 [02:32<00:18,  1.49it/s, loss=0.0144, v_num=0, train_loss=0.000719, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.318, val_accuracy=0.930, val_f1_score=0.930]
Validating:   7%|▋         | 2/29 [00:06<01:14,  2.77s/it][A
Epoch 131:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.0144, v_num=0, train_loss=0.000719, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.318, val_accuracy=0.930, val_f1_score=0.930]
Epoch 131:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.0144, v_num=0, train_loss=0.000719, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.318, val_accuracy=0.930, val_f1_score=0.930]
Validating:  21%|██        | 6/29

Epoch 131, global step 29831: val_loss was not in top 2


Epoch 132:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.0353, v_num=0, train_loss=0.256, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.308, val_accuracy=0.936, val_f1_score=0.936]    
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 132:  89%|████████▉ | 228/255 [02:33<00:18,  1.49it/s, loss=0.0353, v_num=0, train_loss=0.256, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.308, val_accuracy=0.936, val_f1_score=0.936]
Validating:   7%|▋         | 2/29 [00:07<01:19,  2.94s/it][A
Epoch 132:  90%|█████████ | 230/255 [02:33<00:16,  1.49it/s, loss=0.0353, v_num=0, train_loss=0.256, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.308, val_accuracy=0.936, val_f1_score=0.936]
Validating:  14%|█▍        | 4/29 [00:07<00:26,  1.07s/it][A
Epoch 132:  91%|█████████ | 232/255 [02:34<00:15,  1.50it/s, loss=0.0353, v_num=0, train_loss=0.256, train_accuracy=0.889, train_f1_score=0.889, val_loss=0.308, val_accuracy=0.936, 

Epoch 132, global step 30057: val_loss was not in top 2


Epoch 133:  89%|████████▊ | 226/255 [02:26<00:18,  1.55it/s, loss=0.00501, v_num=0, train_loss=0.000601, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.365, val_accuracy=0.932, val_f1_score=0.932]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 133:  89%|████████▉ | 228/255 [02:32<00:18,  1.49it/s, loss=0.00501, v_num=0, train_loss=0.000601, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.365, val_accuracy=0.932, val_f1_score=0.932]
Validating:   7%|▋         | 2/29 [00:06<01:16,  2.82s/it][A
Epoch 133:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.00501, v_num=0, train_loss=0.000601, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.365, val_accuracy=0.932, val_f1_score=0.932]
Validating:  14%|█▍        | 4/29 [00:07<00:26,  1.07s/it][A
Epoch 133:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.00501, v_num=0, train_loss=0.000601, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.365, val_accu

Epoch 133, global step 30283: val_loss reached 0.25597 (best 0.25597), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3-v1.ckpt" as top 2


Epoch 134:  89%|████████▊ | 226/255 [02:33<00:19,  1.47it/s, loss=0.0245, v_num=0, train_loss=0.00276, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.256, val_accuracy=0.943, val_f1_score=0.943]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 134:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.0245, v_num=0, train_loss=0.00276, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.256, val_accuracy=0.943, val_f1_score=0.943]
Epoch 134:  90%|█████████ | 230/255 [02:40<00:17,  1.44it/s, loss=0.0245, v_num=0, train_loss=0.00276, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.256, val_accuracy=0.943, val_f1_score=0.943]
Validating:  14%|█▍        | 4/29 [00:06<00:30,  1.23s/it][A
Epoch 134:  91%|█████████ | 232/255 [02:40<00:15,  1.45it/s, loss=0.0245, v_num=0, train_loss=0.00276, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.256, val_accuracy=0.943, val_f1_score=0.943]
Validating:  21%|██        | 6/29 [0

Epoch 134, global step 30509: val_loss reached 0.24631 (best 0.24631), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3.ckpt" as top 2


Epoch 135:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.0126, v_num=0, train_loss=0.000545, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.246, val_accuracy=0.939, val_f1_score=0.939] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 135:  89%|████████▉ | 228/255 [02:32<00:18,  1.49it/s, loss=0.0126, v_num=0, train_loss=0.000545, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.246, val_accuracy=0.939, val_f1_score=0.939]
Validating:   7%|▋         | 2/29 [00:06<01:16,  2.85s/it][A
Epoch 135:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.0126, v_num=0, train_loss=0.000545, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.246, val_accuracy=0.939, val_f1_score=0.939]
Validating:  14%|█▍        | 4/29 [00:07<00:25,  1.04s/it][A
Epoch 135:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.0126, v_num=0, train_loss=0.000545, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.246, val_accurac

Epoch 135, global step 30735: val_loss was not in top 2


Epoch 136:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.0297, v_num=0, train_loss=0.00761, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.286, val_accuracy=0.935, val_f1_score=0.935] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 136:  89%|████████▉ | 228/255 [02:33<00:18,  1.49it/s, loss=0.0297, v_num=0, train_loss=0.00761, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.286, val_accuracy=0.935, val_f1_score=0.935]
Validating:   7%|▋         | 2/29 [00:06<01:16,  2.84s/it][A
Epoch 136:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.0297, v_num=0, train_loss=0.00761, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.286, val_accuracy=0.935, val_f1_score=0.935]
Validating:  14%|█▍        | 4/29 [00:07<00:25,  1.03s/it][A
Epoch 136:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.0297, v_num=0, train_loss=0.00761, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.286, val_accuracy=0.

Epoch 136, global step 30961: val_loss reached 0.22811 (best 0.22811), saving model to "/Workspace/code/checkpoints/best-checkpoint-corr-3-v1.ckpt" as top 2


Epoch 137:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.00999, v_num=0, train_loss=0.00119, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.228, val_accuracy=0.933, val_f1_score=0.933]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 137:  89%|████████▉ | 228/255 [02:33<00:18,  1.49it/s, loss=0.00999, v_num=0, train_loss=0.00119, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.228, val_accuracy=0.933, val_f1_score=0.933]
Validating:   7%|▋         | 2/29 [00:06<01:16,  2.83s/it][A
Epoch 137:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.00999, v_num=0, train_loss=0.00119, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.228, val_accuracy=0.933, val_f1_score=0.933]
Validating:  14%|█▍        | 4/29 [00:07<00:26,  1.07s/it][A
Epoch 137:  91%|█████████ | 232/255 [02:34<00:15,  1.51it/s, loss=0.00999, v_num=0, train_loss=0.00119, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.228, val_accuracy

Epoch 137, global step 31187: val_loss was not in top 2


Epoch 138:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.00213, v_num=0, train_loss=0.000566, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.249, val_accuracy=0.939, val_f1_score=0.939]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 138:  89%|████████▉ | 228/255 [02:32<00:18,  1.49it/s, loss=0.00213, v_num=0, train_loss=0.000566, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.249, val_accuracy=0.939, val_f1_score=0.939]
Validating:   7%|▋         | 2/29 [00:06<01:16,  2.84s/it][A
Epoch 138:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.00213, v_num=0, train_loss=0.000566, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.249, val_accuracy=0.939, val_f1_score=0.939]
Validating:  14%|█▍        | 4/29 [00:07<00:26,  1.05s/it][A
Epoch 138:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.00213, v_num=0, train_loss=0.000566, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.249, val_accu

Epoch 138, global step 31413: val_loss was not in top 2


Epoch 139:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.0197, v_num=0, train_loss=0.0085, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.264, val_accuracy=0.940, val_f1_score=0.940]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 139:  89%|████████▉ | 228/255 [02:33<00:18,  1.49it/s, loss=0.0197, v_num=0, train_loss=0.0085, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.264, val_accuracy=0.940, val_f1_score=0.940]
Validating:   7%|▋         | 2/29 [00:06<01:16,  2.83s/it][A
Epoch 139:  90%|█████████ | 230/255 [02:33<00:16,  1.49it/s, loss=0.0197, v_num=0, train_loss=0.0085, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.264, val_accuracy=0.940, val_f1_score=0.940]
Validating:  14%|█▍        | 4/29 [00:07<00:26,  1.07s/it][A
Epoch 139:  91%|█████████ | 232/255 [02:34<00:15,  1.50it/s, loss=0.0197, v_num=0, train_loss=0.0085, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.264, val_accuracy=0.94

Epoch 139, global step 31639: val_loss was not in top 2


Epoch 140:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.0017, v_num=0, train_loss=0.00347, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.309, val_accuracy=0.934, val_f1_score=0.934]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 140:  89%|████████▉ | 228/255 [02:33<00:18,  1.49it/s, loss=0.0017, v_num=0, train_loss=0.00347, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.309, val_accuracy=0.934, val_f1_score=0.934]
Validating:   7%|▋         | 2/29 [00:06<01:16,  2.82s/it][A
Epoch 140:  90%|█████████ | 230/255 [02:33<00:16,  1.49it/s, loss=0.0017, v_num=0, train_loss=0.00347, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.309, val_accuracy=0.934, val_f1_score=0.934]
Validating:  14%|█▍        | 4/29 [00:07<00:26,  1.08s/it][A
Epoch 140:  91%|█████████ | 232/255 [02:34<00:15,  1.50it/s, loss=0.0017, v_num=0, train_loss=0.00347, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.309, val_accuracy=0

Epoch 140, global step 31865: val_loss was not in top 2


Epoch 141:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.00142, v_num=0, train_loss=0.000274, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.936, val_f1_score=0.936]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 141:  89%|████████▉ | 228/255 [02:32<00:18,  1.49it/s, loss=0.00142, v_num=0, train_loss=0.000274, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.936, val_f1_score=0.936]
Validating:   7%|▋         | 2/29 [00:06<01:15,  2.80s/it][A
Epoch 141:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.00142, v_num=0, train_loss=0.000274, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.936, val_f1_score=0.936]
Epoch 141:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.00142, v_num=0, train_loss=0.000274, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.936, val_f1_score=0.936]
Validating:  21%|██        | 6

Epoch 141, global step 32091: val_loss was not in top 2


Epoch 142:  89%|████████▊ | 226/255 [02:26<00:18,  1.55it/s, loss=0.00784, v_num=0, train_loss=0.000789, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.306, val_accuracy=0.943, val_f1_score=0.943]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 142:  89%|████████▉ | 228/255 [02:32<00:18,  1.49it/s, loss=0.00784, v_num=0, train_loss=0.000789, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.306, val_accuracy=0.943, val_f1_score=0.943]
Validating:   7%|▋         | 2/29 [00:06<01:17,  2.87s/it][A
Epoch 142:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.00784, v_num=0, train_loss=0.000789, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.306, val_accuracy=0.943, val_f1_score=0.943]
Validating:  14%|█▍        | 4/29 [00:07<00:27,  1.09s/it][A
Epoch 142:  91%|█████████ | 232/255 [02:33<00:15,  1.51it/s, loss=0.00784, v_num=0, train_loss=0.000789, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.306, val_accu

Epoch 142, global step 32317: val_loss was not in top 2


Epoch 143:  89%|████████▊ | 226/255 [02:32<00:19,  1.48it/s, loss=0.0152, v_num=0, train_loss=0.0257, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.323, val_accuracy=0.935, val_f1_score=0.935]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 143:  89%|████████▉ | 228/255 [02:39<00:18,  1.43it/s, loss=0.0152, v_num=0, train_loss=0.0257, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.323, val_accuracy=0.935, val_f1_score=0.935]
Epoch 143:  90%|█████████ | 230/255 [02:39<00:17,  1.44it/s, loss=0.0152, v_num=0, train_loss=0.0257, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.323, val_accuracy=0.935, val_f1_score=0.935]
Epoch 143:  91%|█████████ | 232/255 [02:39<00:15,  1.46it/s, loss=0.0152, v_num=0, train_loss=0.0257, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.323, val_accuracy=0.935, val_f1_score=0.935]
Epoch 143:  92%|█████████▏| 234/255 [02:39<00:14,  1.47it/s, loss=0.0152, v_num=0, train_loss=0.0257,

Epoch 143, global step 32543: val_loss was not in top 2


Epoch 144:  89%|████████▊ | 226/255 [02:29<00:19,  1.52it/s, loss=0.0148, v_num=0, train_loss=0.000648, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.282, val_accuracy=0.942, val_f1_score=0.942] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 144:  89%|████████▉ | 228/255 [02:35<00:18,  1.46it/s, loss=0.0148, v_num=0, train_loss=0.000648, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.282, val_accuracy=0.942, val_f1_score=0.942]
Epoch 144:  90%|█████████ | 230/255 [02:35<00:16,  1.47it/s, loss=0.0148, v_num=0, train_loss=0.000648, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.282, val_accuracy=0.942, val_f1_score=0.942]
Validating:  14%|█▍        | 4/29 [00:07<00:29,  1.16s/it][A
Epoch 144:  91%|█████████ | 232/255 [02:36<00:15,  1.48it/s, loss=0.0148, v_num=0, train_loss=0.000648, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.282, val_accuracy=0.942, val_f1_score=0.942]
Validating:  21%|██        | 6/29

Epoch 144, global step 32769: val_loss was not in top 2


Epoch 145:  89%|████████▊ | 226/255 [02:26<00:18,  1.54it/s, loss=0.00703, v_num=0, train_loss=0.00893, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.272, val_accuracy=0.934, val_f1_score=0.934]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 145:  89%|████████▉ | 228/255 [02:33<00:18,  1.49it/s, loss=0.00703, v_num=0, train_loss=0.00893, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.272, val_accuracy=0.934, val_f1_score=0.934]
Validating:   7%|▋         | 2/29 [00:06<01:14,  2.77s/it][A
Epoch 145:  90%|█████████ | 230/255 [02:33<00:16,  1.50it/s, loss=0.00703, v_num=0, train_loss=0.00893, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.272, val_accuracy=0.934, val_f1_score=0.934]
Validating:  14%|█▍        | 4/29 [00:07<00:26,  1.05s/it][A
Epoch 145:  91%|█████████ | 232/255 [02:34<00:15,  1.51it/s, loss=0.00703, v_num=0, train_loss=0.00893, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.272, val_accura

Epoch 145, global step 32995: val_loss was not in top 2


Epoch 146:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.0026, v_num=0, train_loss=0.00014, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.315, val_accuracy=0.939, val_f1_score=0.939]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 146:  89%|████████▉ | 228/255 [02:34<00:18,  1.48it/s, loss=0.0026, v_num=0, train_loss=0.00014, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.315, val_accuracy=0.939, val_f1_score=0.939]
Validating:   7%|▋         | 2/29 [00:06<01:17,  2.89s/it][A
Epoch 146:  90%|█████████ | 230/255 [02:34<00:16,  1.49it/s, loss=0.0026, v_num=0, train_loss=0.00014, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.315, val_accuracy=0.939, val_f1_score=0.939]
Validating:  14%|█▍        | 4/29 [00:07<00:27,  1.09s/it][A
Epoch 146:  91%|█████████ | 232/255 [02:34<00:15,  1.50it/s, loss=0.0026, v_num=0, train_loss=0.00014, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.315, val_accuracy=0

Epoch 146, global step 33221: val_loss was not in top 2


Epoch 147:  89%|████████▊ | 226/255 [01:21<00:10,  2.78it/s, loss=0.0122, v_num=0, train_loss=0.0038, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.319, val_accuracy=0.940, val_f1_score=0.940]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 147:  89%|████████▉ | 228/255 [01:28<00:10,  2.58it/s, loss=0.0122, v_num=0, train_loss=0.0038, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.319, val_accuracy=0.940, val_f1_score=0.940]
Epoch 147:  90%|█████████ | 230/255 [01:28<00:09,  2.60it/s, loss=0.0122, v_num=0, train_loss=0.0038, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.319, val_accuracy=0.940, val_f1_score=0.940]
Epoch 147:  91%|█████████ | 232/255 [01:28<00:08,  2.62it/s, loss=0.0122, v_num=0, train_loss=0.0038, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.319, val_accuracy=0.940, val_f1_score=0.940]
Epoch 147:  92%|█████████▏| 234/255 [01:28<00:07,  2.64it/s, loss=0.0122, v_num=0, train_loss=0.0038,

Epoch 147, global step 33447: val_loss was not in top 2


Epoch 148:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.00948, v_num=0, train_loss=0.000175, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.940, val_f1_score=0.940]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 148:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.00948, v_num=0, train_loss=0.000175, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.940, val_f1_score=0.940]
Epoch 148:  90%|█████████ | 230/255 [01:26<00:09,  2.64it/s, loss=0.00948, v_num=0, train_loss=0.000175, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.940, val_f1_score=0.940]
Epoch 148:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.00948, v_num=0, train_loss=0.000175, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.308, val_accuracy=0.940, val_f1_score=0.940]
Epoch 148:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.00948, v_num=0, train_lo

Epoch 148, global step 33673: val_loss was not in top 2


Epoch 149:  89%|████████▊ | 226/255 [01:20<00:10,  2.80it/s, loss=0.0134, v_num=0, train_loss=0.0072, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.325, val_accuracy=0.935, val_f1_score=0.935]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 149:  89%|████████▉ | 228/255 [01:27<00:10,  2.62it/s, loss=0.0134, v_num=0, train_loss=0.0072, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.325, val_accuracy=0.935, val_f1_score=0.935]
Epoch 149:  90%|█████████ | 230/255 [01:27<00:09,  2.64it/s, loss=0.0134, v_num=0, train_loss=0.0072, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.325, val_accuracy=0.935, val_f1_score=0.935]
Epoch 149:  91%|█████████ | 232/255 [01:27<00:08,  2.65it/s, loss=0.0134, v_num=0, train_loss=0.0072, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.325, val_accuracy=0.935, val_f1_score=0.935]
Epoch 149:  92%|█████████▏| 234/255 [01:27<00:07,  2.67it/s, loss=0.0134, v_num=0, train_loss=0.0072,

Epoch 149, global step 33899: val_loss was not in top 2


Epoch 150:  89%|████████▊ | 226/255 [01:20<00:10,  2.82it/s, loss=0.00681, v_num=0, train_loss=0.000423, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.284, val_accuracy=0.934, val_f1_score=0.934]
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 150:  89%|████████▉ | 228/255 [01:26<00:10,  2.64it/s, loss=0.00681, v_num=0, train_loss=0.000423, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.284, val_accuracy=0.934, val_f1_score=0.934]
Epoch 150:  90%|█████████ | 230/255 [01:26<00:09,  2.66it/s, loss=0.00681, v_num=0, train_loss=0.000423, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.284, val_accuracy=0.934, val_f1_score=0.934]
Epoch 150:  91%|█████████ | 232/255 [01:26<00:08,  2.67it/s, loss=0.00681, v_num=0, train_loss=0.000423, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.284, val_accuracy=0.934, val_f1_score=0.934]
Epoch 150:  92%|█████████▏| 234/255 [01:26<00:07,  2.69it/s, loss=0.00681, v_num=0, train_lo

Epoch 150, global step 34125: val_loss was not in top 2


Epoch 151:  89%|████████▊ | 226/255 [01:21<00:10,  2.79it/s, loss=0.0019, v_num=0, train_loss=0.00188, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.270, val_accuracy=0.938, val_f1_score=0.938]  
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 151:  89%|████████▉ | 228/255 [01:27<00:10,  2.62it/s, loss=0.0019, v_num=0, train_loss=0.00188, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.270, val_accuracy=0.938, val_f1_score=0.938]
Epoch 151:  90%|█████████ | 230/255 [01:27<00:09,  2.63it/s, loss=0.0019, v_num=0, train_loss=0.00188, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.270, val_accuracy=0.938, val_f1_score=0.938]
Epoch 151:  91%|█████████ | 232/255 [01:27<00:08,  2.65it/s, loss=0.0019, v_num=0, train_loss=0.00188, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.270, val_accuracy=0.938, val_f1_score=0.938]
Epoch 151:  92%|█████████▏| 234/255 [01:27<00:07,  2.67it/s, loss=0.0019, v_num=0, train_loss=0.00

Epoch 151, global step 34351: val_loss was not in top 2


Epoch 152:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.0195, v_num=0, train_loss=0.0244, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.270, val_accuracy=0.938, val_f1_score=0.938]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 152:  89%|████████▉ | 228/255 [01:26<00:10,  2.63it/s, loss=0.0195, v_num=0, train_loss=0.0244, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.270, val_accuracy=0.938, val_f1_score=0.938]
Epoch 152:  90%|█████████ | 230/255 [01:26<00:09,  2.64it/s, loss=0.0195, v_num=0, train_loss=0.0244, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.270, val_accuracy=0.938, val_f1_score=0.938]
Epoch 152:  91%|█████████ | 232/255 [01:27<00:08,  2.66it/s, loss=0.0195, v_num=0, train_loss=0.0244, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.270, val_accuracy=0.938, val_f1_score=0.938]
Epoch 152:  92%|█████████▏| 234/255 [01:27<00:07,  2.68it/s, loss=0.0195, v_num=0, train_loss=0.0244,

Epoch 152, global step 34577: val_loss was not in top 2


Epoch 153:  89%|████████▊ | 226/255 [01:20<00:10,  2.81it/s, loss=0.0124, v_num=0, train_loss=0.00145, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.287, val_accuracy=0.940, val_f1_score=0.940] 
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 153:  89%|████████▉ | 228/255 [01:27<00:10,  2.62it/s, loss=0.0124, v_num=0, train_loss=0.00145, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.287, val_accuracy=0.940, val_f1_score=0.940]
Validating:   7%|▋         | 2/29 [00:06<01:17,  2.87s/it][A
Epoch 153:  90%|█████████ | 230/255 [01:27<00:09,  2.63it/s, loss=0.0124, v_num=0, train_loss=0.00145, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.287, val_accuracy=0.940, val_f1_score=0.940]
Validating:  14%|█▍        | 4/29 [00:07<00:26,  1.05s/it][A
Epoch 153:  91%|█████████ | 232/255 [01:27<00:08,  2.64it/s, loss=0.0124, v_num=0, train_loss=0.00145, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.287, val_accuracy=0.

Epoch 153, global step 34803: val_loss was not in top 2


Epoch 154:  89%|████████▊ | 226/255 [02:27<00:18,  1.53it/s, loss=0.016, v_num=0, train_loss=0.00607, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.271, val_accuracy=0.935, val_f1_score=0.935]   
Validating: 0it [00:00, ?it/s][A
Validating:   0%|          | 0/29 [00:00<?, ?it/s][A
Epoch 154:  89%|████████▉ | 228/255 [02:33<00:18,  1.48it/s, loss=0.016, v_num=0, train_loss=0.00607, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.271, val_accuracy=0.935, val_f1_score=0.935]
Validating:   7%|▋         | 2/29 [00:06<01:13,  2.71s/it][A
Epoch 154:  90%|█████████ | 230/255 [02:34<00:16,  1.49it/s, loss=0.016, v_num=0, train_loss=0.00607, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.271, val_accuracy=0.935, val_f1_score=0.935]
Validating:  14%|█▍        | 4/29 [00:06<00:25,  1.03s/it][A
Epoch 154:  91%|█████████ | 232/255 [02:34<00:15,  1.50it/s, loss=0.016, v_num=0, train_loss=0.00607, train_accuracy=1.000, train_f1_score=1.000, val_loss=0.271, val_accuracy=0.93

Epoch 154, global step 35029: val_loss was not in top 2


Epoch 155:  23%|██▎       | 58/255 [00:44<02:29,  1.32it/s, loss=0.0063, v_num=0, train_loss=0.056, train_accuracy=0.980, train_f1_score=0.980, val_loss=0.265, val_accuracy=0.935, val_f1_score=0.935]    

  rank_zero_warn("Detected KeyboardInterrupt, attempting graceful shutdown...")
LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1,2]


Testing: 100%|██████████| 29/29 [00:12<00:00,  2.37it/s]/s, loss=0.0063, v_num=0, train_loss=0.056, train_accuracy=0.980, train_f1_score=0.980, val_loss=0.265, val_accuracy=0.935, val_f1_score=0.935]--------------------------------------------------------------------------------
DATALOADER:0 TEST RESULTS
{'test_f1_score': 0.9474804997444153,
 'test_train_accuracy': 0.9474804997444153,
 'test_train_loss': 0.2336176037788391}
--------------------------------------------------------------------------------
Testing: 100%|██████████| 29/29 [00:12<00:00,  2.29it/s]
------------------ Round: 4 ------------------
['O2', 'O1', 'FT7', 'F4', 'TP7', 'C3', 'C4', 'F3', 'FT8', 'T6', 'HEOR', 'T5', 'VEOL', 'F7', 'FZ', 'VEOU', 'A1', 'P3', 'PZ', 'CP3', 'P4', 'CPZ', 'A2', 'HEOL', 'CP4', 'FT9', 'F8', 'OZ', 'CZ', 'FC4', 'FC3', 'FP1', 'PO1', 'T3', 'T4', 'PO2']
Len: 36


Traceback (most recent call last):
  File "/usr/lib/python3.6/multiprocessing/queues.py", line 240, in _feed
    send_bytes(obj)
  File "/usr/lib/python3.6/multiprocessing/connection.py", line 200, in send_bytes
    self._send_bytes(m[offset:offset + size])
  File "/usr/lib/python3.6/multiprocessing/connection.py", line 404, in _send_bytes
    self._send(header + buf)
  File "/usr/lib/python3.6/multiprocessing/connection.py", line 368, in _send
    n = write(self._handle, buf)
BrokenPipeError: [Errno 32] Broken pipe


## Load Checkpoint 

In [None]:
# best-checkpoint-corr-3-v1.ckptn
# trainer.fit(model, data_module, ckpt_path="/Workspace/code/checkpoints/best-checkpoint-corr-3-v1.ckpt")