## 0. Imports and Constants
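- Before running the rest of the notebook, set `user` (and, if needed, the dataset `version`) in the SELECT block of the cell below; all data and model paths are derived from them.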

In [74]:
############## AUTORELOAD MAGIC ###################
%load_ext autoreload
%autoreload 2
###################################################

############## FUNDAMENTAL MODULES ################
import json
from PIL import Image
import os
import sys
import matplotlib.pyplot as plt
import numpy as np
import pickle
import re
 ##################################################

############## TASK-SPECIFIC MODULES ##############
sys.path.append(os.path.join(os.getcwd(),"src"))
from vanilla_dataset import VanillaDataset
from vanilla_nn import VanillaNN
from trainer import Trainer
###################################################


####################### CONSTANTS ########################
# Identifiers for the individual splits and modalities.
TRAIN = "train"
DEV = "dev"
TEST = "test"
TXT = "txt"
IMG = "img"

# Every split for which labels and features are loaded.
SPLITS = [TRAIN, DEV, TEST, "gold"]

# Feature-engineering methods; each name is also the sub-directory of the
# features directory that holds that method's pickles.
FE_METHODS = [
    "txt_embeddings",
    "img_embeddings",
    "concat",
    "sum",
    "mean",
    "hadamard",
]
# Cosine variants, currently disabled:
#FE_METHODS += ["concat_cos", "sum_cos", "mean_cos", "hadamard_cos"]
##########################################################

############## DATA SCIENCE & ML MODULES #################
from transformers import CLIPTokenizerFast, CLIPProcessor, CLIPModel
import torch
import pandas as pd
from scipy import stats
from sklearn.svm import SVC
from sklearn.metrics import classification_report
##########################################################

####################### SELECT ###########################
users = ["patriziopalmisano", "onurdenizguler", "jockl"]
user = users[2] # SELECT USER
version = "v2" # SELECT DATASET VERSION
dataset_version = version
##########################################################

# Root of the shared Drive folder on the selected user's machine.
# The first two users share the macOS CloudStorage layout; any other
# selection falls back to the Insync mount under /home/jockl.
if user not in users[:2]:
    cw_dir = "/home/jockl/Insync/check.worthiness@gmail.com/Google Drive"
else:
    cw_dir = f"/Users/{user}/Library/CloudStorage/GoogleDrive-check.worthiness@gmail.com/My Drive"

# Everything else is derived from the root, so the layout is spelled out once.
data_dir = f"{cw_dir}/data/CT23_1A_checkworthy_multimodal_english_{dataset_version}"
features_dir = f"{data_dir}/features"
labels_dir = f"{data_dir}/labels"
models_dir = f"{cw_dir}/models/vanillann_hyperparam_search"

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload


# 1. Load the Datasets

In [75]:
def _load_split_pickle(path_stem, split):
    """Load one split's ``.pickle`` file through ``np.load``.

    Files of every split except "gold" carry a ``_{dataset_version}`` suffix
    right before the extension; the "gold" files have no version suffix.

    NOTE: ``allow_pickle=True`` unpickles the file contents, so only point
    this at files you trust.
    """
    suffix = "" if split == "gold" else f"_{dataset_version}"
    return np.load(f"{path_stem}{suffix}.pickle", allow_pickle=True)


# split -> labels
split_to_labels = {
    split: _load_split_pickle(f"{labels_dir}/{split}_labels", split)
    for split in SPLITS
}

# feature-engineering method -> split -> features
method_to_split_to_data = {
    fe_method: {
        split: _load_split_pickle(f"{features_dir}/{fe_method}/{fe_method}_{split}", split)
        for split in SPLITS
    }
    for fe_method in FE_METHODS
}

# feature-engineering method -> split -> VanillaDataset pairing features with labels
method_to_split_to_dataset = {
    fe_method: {
        split: VanillaDataset(features, split_to_labels[split])
        for split, features in split_to_data.items()
    }
    for fe_method, split_to_data in method_to_split_to_data.items()
}

# 2. Hyperparam Search

In this section, the same hyperparameter search is run once for each feature-engineering method. Every search uses the following hyperparameter grid:

In [76]:
# Hyperparameter grid shared by every search in this section.
# Each entry of `model_init_param_configs` is passed on its own as
# `model_init_params` to `hyperparameter_search`
# (presumably the hidden-layer widths of the network -- TODO confirm).
model_init_param_configs = [
    # four- and three-value configurations
    [128, 64, 32, 16],
    [128, 64, 32],
    [64, 32, 128],
    # two-value configurations
    [128, 64], [64, 32], [32, 16],
    # single-value configurations
    [64], [32], [16],
]
learning_rates = [1e-7, 1e-6, 1e-5, 1e-4, 1e-3]
batch_sizes = [2 ** exponent for exponent in range(3, 8)]  # 8, 16, 32, 64, 128
num_epochs = 1000  # the recorded runs usually quit early, well before this

In [77]:
# Select device
# This string is handed unchanged to `hyperparameter_search` through its
# `device` argument in the search cells below.
device = "cpu"

## 2.1 Hyperparam Search on Text Embeddings

In [78]:
# Model class to train; the class itself (not an instance) is given to the Trainer
model = VanillaNN

# Feature-engineering method searched in this section, and its per-split datasets
dataset_method = "txt_embeddings"
dataset_dict = method_to_split_to_dataset[dataset_method]

# Trainer bound to the model class, the method name, and that method's datasets
trainer_text = Trainer(model, dataset_method, dataset_dict)

In [79]:
# Run the hyperparameter search once per model configuration.
# Only `model_init_params` changes between calls; the remaining settings are shared.
search_settings = {
    "device": device,
    "learning_rates": learning_rates,
    "batch_sizes": batch_sizes,
    "num_epochs": num_epochs,
}
for model_config in model_init_param_configs:
    trainer_text.hyperparameter_search(model_init_params=model_config, **search_settings)

100%|██████████| 1000/1000 [14:48<00:00,  1.12it/s]
100%|██████████| 1000/1000 [07:27<00:00,  2.23it/s]
  2%|▏         | 16/1000 [00:04<04:43,  3.47it/s]
  0%|          | 1/1000 [00:00<02:49,  5.89it/s]

Early quitting at epoch: 16


  1%|          | 10/1000 [00:01<03:02,  5.41it/s]
  0%|          | 1/1000 [00:00<01:52,  8.91it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:07,  7.78it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 35%|███▌      | 354/1000 [05:02<09:12,  1.17it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 354


 48%|████▊     | 479/1000 [03:36<03:55,  2.21it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 479


  2%|▏         | 15/1000 [00:04<04:27,  3.69it/s]
  0%|          | 1/1000 [00:00<02:21,  7.04it/s]

Early quitting at epoch: 15


  1%|          | 10/1000 [00:01<02:31,  6.54it/s]
  0%|          | 1/1000 [00:00<01:41,  9.87it/s]

Early quitting at epoch: 10


  1%|▏         | 13/1000 [00:01<01:56,  8.51it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 13


  5%|▍         | 46/1000 [00:40<14:09,  1.12it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 46


  6%|▌         | 59/1000 [00:27<07:16,  2.16it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 59


  7%|▋         | 70/1000 [00:18<04:08,  3.74it/s]
  0%|          | 1/1000 [00:00<02:19,  7.18it/s]

Early quitting at epoch: 70


  6%|▌         | 57/1000 [00:08<02:26,  6.42it/s]
  0%|          | 1/1000 [00:00<01:45,  9.50it/s]

Early quitting at epoch: 57


  5%|▍         | 47/1000 [00:04<01:33, 10.15it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 47


  1%|          | 10/1000 [00:09<15:24,  1.07it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:04<08:13,  2.01it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 12/1000 [00:03<04:30,  3.66it/s]
  0%|          | 1/1000 [00:00<02:26,  6.84it/s]

Early quitting at epoch: 12


  2%|▏         | 17/1000 [00:02<02:42,  6.04it/s]
  0%|          | 1/1000 [00:00<01:44,  9.58it/s]

Early quitting at epoch: 17


  2%|▏         | 18/1000 [00:01<01:46,  9.23it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 18


  1%|          | 10/1000 [00:09<15:47,  1.04it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:05<08:36,  1.92it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:02<04:19,  3.82it/s]
  0%|          | 1/1000 [00:00<02:27,  6.78it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:43,  6.07it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<01:51,  8.84it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 92%|█████████▏| 919/1000 [11:54<01:03,  1.29it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 919


 98%|█████████▊| 980/1000 [06:42<00:08,  2.43it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 980


  1%|          | 11/1000 [00:02<04:07,  4.00it/s]
  0%|          | 1/1000 [00:00<02:28,  6.72it/s]

Early quitting at epoch: 11


  1%|          | 11/1000 [00:01<02:27,  6.70it/s]
  0%|          | 2/1000 [00:00<01:18, 12.79it/s]

Early quitting at epoch: 11


  1%|          | 12/1000 [00:01<01:44,  9.41it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 12


 28%|██▊       | 277/1000 [03:38<09:29,  1.27it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 277


 40%|████      | 401/1000 [02:47<04:10,  2.39it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 401


  1%|          | 12/1000 [00:03<04:11,  3.93it/s]
  0%|          | 1/1000 [00:00<02:11,  7.59it/s]

Early quitting at epoch: 12


  1%|          | 12/1000 [00:01<02:22,  6.93it/s]
  0%|          | 2/1000 [00:00<01:27, 11.45it/s]

Early quitting at epoch: 12


  1%|          | 11/1000 [00:01<01:37, 10.10it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 11


  4%|▎         | 35/1000 [00:27<12:48,  1.26it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 35


  5%|▍         | 48/1000 [00:19<06:34,  2.41it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 48


  5%|▌         | 51/1000 [00:11<03:42,  4.27it/s]
  0%|          | 1/1000 [00:00<02:06,  7.88it/s]

Early quitting at epoch: 51


  4%|▍         | 43/1000 [00:06<02:23,  6.68it/s]
  0%|          | 2/1000 [00:00<01:30, 10.98it/s]

Early quitting at epoch: 43


  2%|▏         | 21/1000 [00:02<01:34, 10.33it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 21


  1%|          | 10/1000 [00:08<13:27,  1.23it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:04<07:06,  2.32it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 11/1000 [00:02<04:14,  3.89it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 11


  2%|▏         | 18/1000 [00:02<02:37,  6.22it/s]
  0%|          | 1/1000 [00:00<01:42,  9.76it/s]

Early quitting at epoch: 18


  2%|▏         | 18/1000 [00:01<01:36, 10.17it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 18


  1%|          | 10/1000 [00:08<13:39,  1.21it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:04<07:22,  2.23it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:02<04:42,  3.51it/s]
  0%|          | 1/1000 [00:00<02:18,  7.24it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:40,  6.16it/s]
  0%|          | 1/1000 [00:00<01:53,  8.78it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<01:51,  8.85it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 81%|████████  | 811/1000 [09:06<02:07,  1.48it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 811


100%|██████████| 1000/1000 [06:07<00:00,  2.72it/s]
  1%|          | 12/1000 [00:02<03:39,  4.50it/s]
  0%|          | 1/1000 [00:00<01:57,  8.50it/s]

Early quitting at epoch: 12


  1%|          | 12/1000 [00:01<02:14,  7.36it/s]
  0%|          | 2/1000 [00:00<01:32, 10.81it/s]

Early quitting at epoch: 12


  1%|          | 10/1000 [00:00<01:34, 10.44it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 36%|███▌      | 357/1000 [04:05<07:21,  1.46it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 357


 42%|████▏     | 416/1000 [02:34<03:36,  2.70it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 416


  6%|▌         | 60/1000 [00:12<03:15,  4.81it/s]
  0%|          | 1/1000 [00:00<01:56,  8.58it/s]

Early quitting at epoch: 60


  1%|          | 10/1000 [00:01<02:30,  6.59it/s]
  0%|          | 2/1000 [00:00<01:19, 12.59it/s]

Early quitting at epoch: 10


  1%|          | 12/1000 [00:01<01:31, 10.82it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 12


  5%|▍         | 49/1000 [00:34<11:07,  1.42it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 49


  6%|▋         | 64/1000 [00:24<05:59,  2.60it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 64


  4%|▍         | 43/1000 [00:09<03:26,  4.64it/s]
  0%|          | 1/1000 [00:00<02:06,  7.90it/s]

Early quitting at epoch: 43


  5%|▌         | 51/1000 [00:06<01:59,  7.96it/s]
  0%|          | 2/1000 [00:00<01:28, 11.28it/s]

Early quitting at epoch: 51


  4%|▍         | 38/1000 [00:03<01:21, 11.76it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 38


  1%|          | 10/1000 [00:07<12:13,  1.35it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 11/1000 [00:04<06:57,  2.37it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 11


  1%|▏         | 14/1000 [00:03<03:34,  4.60it/s]
  0%|          | 1/1000 [00:00<01:51,  8.99it/s]

Early quitting at epoch: 14


  1%|▏         | 14/1000 [00:01<02:03,  7.99it/s]
  0%|          | 2/1000 [00:00<01:15, 13.20it/s]

Early quitting at epoch: 14


  2%|▏         | 17/1000 [00:01<01:30, 10.87it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 17


  1%|          | 10/1000 [00:07<12:08,  1.36it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:04<06:39,  2.48it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:02<03:51,  4.27it/s]
  0%|          | 1/1000 [00:00<02:08,  7.78it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:16,  7.26it/s]
  0%|          | 2/1000 [00:00<01:27, 11.39it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<01:41,  9.71it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 63%|██████▎   | 634/1000 [07:03<04:04,  1.50it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 634


 98%|█████████▊| 984/1000 [05:56<00:05,  2.76it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 984


 12%|█▏        | 121/1000 [00:25<03:07,  4.70it/s]
  0%|          | 1/1000 [00:00<02:07,  7.81it/s]

Early quitting at epoch: 121


  1%|          | 10/1000 [00:01<02:36,  6.32it/s]
  0%|          | 2/1000 [00:00<01:26, 11.58it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:00<01:38, 10.05it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 24%|██▍       | 245/1000 [02:44<08:26,  1.49it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 245


 36%|███▌      | 361/1000 [02:13<03:55,  2.71it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 361


 11%|█         | 106/1000 [00:22<03:07,  4.77it/s]
  0%|          | 1/1000 [00:00<02:09,  7.70it/s]

Early quitting at epoch: 106


  6%|▋         | 65/1000 [00:08<02:00,  7.78it/s]
  0%|          | 2/1000 [00:00<01:18, 12.64it/s]

Early quitting at epoch: 65


  2%|▏         | 15/1000 [00:01<01:25, 11.56it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 15


  4%|▍         | 42/1000 [00:29<11:02,  1.45it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 42


  6%|▌         | 61/1000 [00:22<05:49,  2.68it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 61


  5%|▍         | 49/1000 [00:10<03:25,  4.62it/s]
  0%|          | 1/1000 [00:00<02:00,  8.27it/s]

Early quitting at epoch: 49


  3%|▎         | 30/1000 [00:03<02:08,  7.54it/s]
  0%|          | 2/1000 [00:00<01:18, 12.75it/s]

Early quitting at epoch: 30


  3%|▎         | 33/1000 [00:02<01:25, 11.35it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 33


  1%|          | 10/1000 [00:07<12:30,  1.32it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:04<06:36,  2.49it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 11/1000 [00:02<04:02,  4.07it/s]
  0%|          | 1/1000 [00:00<02:09,  7.71it/s]

Early quitting at epoch: 11


  2%|▏         | 17/1000 [00:02<02:15,  7.28it/s]
  0%|          | 2/1000 [00:00<01:23, 12.02it/s]

Early quitting at epoch: 17


  1%|▏         | 13/1000 [00:01<01:25, 11.48it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 13


  1%|          | 10/1000 [00:07<11:49,  1.39it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:04<06:40,  2.47it/s]
  0%|          | 1/1000 [00:00<03:03,  5.44it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:02<03:54,  4.23it/s]
  0%|          | 1/1000 [00:00<02:09,  7.73it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:17,  7.18it/s]
  0%|          | 2/1000 [00:00<01:33, 10.65it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<01:40,  9.90it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 72%|███████▏  | 717/1000 [06:56<02:44,  1.72it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 717


100%|██████████| 1000/1000 [05:11<00:00,  3.21it/s]
  1%|          | 10/1000 [00:01<03:09,  5.22it/s]
  0%|          | 1/1000 [00:00<01:44,  9.59it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<01:54,  8.63it/s]
  0%|          | 2/1000 [00:00<01:17, 12.84it/s]

Early quitting at epoch: 10


  1%|          | 11/1000 [00:00<01:24, 11.77it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 11


 34%|███▎      | 335/1000 [03:13<06:23,  1.73it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 335


 37%|███▋      | 374/1000 [01:56<03:15,  3.20it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 374


 10%|█         | 103/1000 [00:18<02:42,  5.54it/s]
  0%|          | 1/1000 [00:00<02:01,  8.24it/s]

Early quitting at epoch: 103


  1%|          | 12/1000 [00:01<01:50,  8.94it/s]
  0%|          | 2/1000 [00:00<01:00, 16.62it/s]

Early quitting at epoch: 12


  2%|▏         | 16/1000 [00:01<01:20, 12.26it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 16


  7%|▋         | 66/1000 [00:38<09:09,  1.70it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 66


  9%|▊         | 86/1000 [00:26<04:36,  3.30it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 86


  6%|▋         | 64/1000 [00:11<02:49,  5.52it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 64


  5%|▌         | 53/1000 [00:05<01:43,  9.16it/s]
  0%|          | 2/1000 [00:00<01:10, 14.23it/s]

Early quitting at epoch: 53


  3%|▎         | 31/1000 [00:02<01:16, 12.66it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 31


  1%|          | 11/1000 [00:06<10:27,  1.58it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 11


  1%|▏         | 14/1000 [00:04<05:29,  3.00it/s]
  0%|          | 1/1000 [00:00<02:56,  5.66it/s]

Early quitting at epoch: 14


  1%|▏         | 14/1000 [00:02<03:15,  5.03it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 14


  2%|▏         | 17/1000 [00:01<01:47,  9.15it/s]
  0%|          | 2/1000 [00:00<01:08, 14.50it/s]

Early quitting at epoch: 17


  2%|▏         | 20/1000 [00:01<01:12, 13.54it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 20


  1%|          | 10/1000 [00:06<10:24,  1.59it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:03<05:38,  2.92it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:02<03:21,  4.91it/s]
  0%|          | 1/1000 [00:00<01:42,  9.79it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<01:54,  8.63it/s]
  0%|          | 2/1000 [00:00<01:12, 13.70it/s]

Early quitting at epoch: 10


  1%|          | 11/1000 [00:00<01:20, 12.22it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 11


 58%|█████▊    | 579/1000 [04:54<03:34,  1.97it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 579


100%|██████████| 1000/1000 [04:34<00:00,  3.64it/s]
  1%|▏         | 13/1000 [00:02<02:46,  5.94it/s]
  0%|          | 2/1000 [00:00<01:27, 11.44it/s]

Early quitting at epoch: 13


  1%|▏         | 13/1000 [00:01<01:37, 10.15it/s]
  0%|          | 2/1000 [00:00<01:06, 15.11it/s]

Early quitting at epoch: 13


  1%|          | 10/1000 [00:00<01:10, 14.07it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 33%|███▎      | 330/1000 [02:49<05:43,  1.95it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 330


 51%|█████     | 507/1000 [02:19<02:15,  3.64it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 507


  2%|▎         | 25/1000 [00:04<02:42,  5.98it/s]
  0%|          | 2/1000 [00:00<01:23, 11.98it/s]

Early quitting at epoch: 25


  6%|▌         | 58/1000 [00:05<01:31, 10.32it/s]
  0%|          | 2/1000 [00:00<01:05, 15.25it/s]

Early quitting at epoch: 58


  1%|          | 10/1000 [00:00<01:12, 13.61it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  8%|▊         | 81/1000 [00:42<07:59,  1.91it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 81


 12%|█▏        | 120/1000 [00:33<04:02,  3.63it/s]
  0%|          | 1/1000 [00:00<02:16,  7.34it/s]

Early quitting at epoch: 120


  6%|▌         | 60/1000 [00:09<02:26,  6.42it/s]
  0%|          | 1/1000 [00:00<01:45,  9.49it/s]

Early quitting at epoch: 60


  4%|▍         | 40/1000 [00:04<01:36,  9.99it/s]
  0%|          | 2/1000 [00:00<01:12, 13.69it/s]

Early quitting at epoch: 40


  2%|▏         | 17/1000 [00:01<01:10, 13.88it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 17


  1%|▏         | 13/1000 [00:07<09:16,  1.77it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 13


  2%|▏         | 15/1000 [00:04<04:50,  3.39it/s]
  0%|          | 1/1000 [00:00<02:23,  6.96it/s]

Early quitting at epoch: 15


  2%|▏         | 21/1000 [00:03<02:32,  6.41it/s]
  0%|          | 2/1000 [00:00<01:34, 10.55it/s]

Early quitting at epoch: 21


  2%|▏         | 24/1000 [00:02<01:39,  9.80it/s]
  0%|          | 2/1000 [00:00<01:04, 15.52it/s]

Early quitting at epoch: 24


  2%|▏         | 21/1000 [00:01<01:06, 14.78it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 21


  1%|          | 10/1000 [00:05<09:15,  1.78it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:03<05:06,  3.23it/s]
  0%|          | 1/1000 [00:00<02:36,  6.38it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:54,  5.66it/s]
  0%|          | 1/1000 [00:00<01:46,  9.39it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<01:47,  9.21it/s]
  0%|          | 2/1000 [00:00<01:03, 15.60it/s]

Early quitting at epoch: 10


  1%|          | 11/1000 [00:00<01:12, 13.67it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 11


 54%|█████▍    | 543/1000 [04:11<03:31,  2.16it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 543


 95%|█████████▌| 953/1000 [04:03<00:12,  3.92it/s]
  0%|          | 1/1000 [00:00<02:39,  6.25it/s]

Early quitting at epoch: 953


  2%|▏         | 18/1000 [00:02<02:38,  6.19it/s]
  0%|          | 2/1000 [00:00<01:23, 12.02it/s]

Early quitting at epoch: 18


  1%|          | 12/1000 [00:01<01:32, 10.64it/s]
  0%|          | 2/1000 [00:00<01:06, 15.02it/s]

Early quitting at epoch: 12


  1%|          | 10/1000 [00:00<01:08, 14.55it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 24%|██▎       | 235/1000 [01:49<05:56,  2.15it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 235


 33%|███▎      | 327/1000 [01:22<02:49,  3.97it/s]
  0%|          | 1/1000 [00:00<02:24,  6.93it/s]

Early quitting at epoch: 327


  8%|▊         | 77/1000 [00:11<02:22,  6.47it/s]
  0%|          | 2/1000 [00:00<01:23, 11.92it/s]

Early quitting at epoch: 77


  2%|▏         | 17/1000 [00:01<01:33, 10.53it/s]
  0%|          | 2/1000 [00:00<01:05, 15.18it/s]

Early quitting at epoch: 17


  1%|          | 11/1000 [00:00<01:14, 13.30it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 11


  8%|▊         | 81/1000 [00:37<07:08,  2.14it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 81


 10%|█         | 104/1000 [00:26<03:52,  3.86it/s]
  0%|          | 1/1000 [00:00<02:27,  6.78it/s]

Early quitting at epoch: 104


  4%|▍         | 40/1000 [00:06<02:27,  6.49it/s]
  0%|          | 2/1000 [00:00<01:30, 11.03it/s]

Early quitting at epoch: 40


  5%|▍         | 46/1000 [00:04<01:30, 10.58it/s]
  0%|          | 2/1000 [00:00<00:54, 18.24it/s]

Early quitting at epoch: 46


  3%|▎         | 34/1000 [00:02<01:02, 15.45it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 34


  1%|▏         | 13/1000 [00:06<08:29,  1.94it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 13


  2%|▏         | 15/1000 [00:03<04:19,  3.80it/s]
  0%|          | 1/1000 [00:00<02:20,  7.12it/s]

Early quitting at epoch: 15


  2%|▏         | 16/1000 [00:02<02:36,  6.29it/s]
  0%|          | 2/1000 [00:00<01:35, 10.44it/s]

Early quitting at epoch: 16


  2%|▏         | 17/1000 [00:01<01:35, 10.28it/s]
  0%|          | 2/1000 [00:00<01:00, 16.52it/s]

Early quitting at epoch: 17


  2%|▏         | 21/1000 [00:01<01:11, 13.64it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 21


  1%|          | 10/1000 [00:05<08:19,  1.98it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:02<04:44,  3.48it/s]
  0%|          | 1/1000 [00:00<02:23,  6.98it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:42,  6.08it/s]
  0%|          | 2/1000 [00:00<01:25, 11.72it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<01:43,  9.56it/s]
  0%|          | 2/1000 [00:00<01:02, 15.93it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:00<01:08, 14.48it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 42%|████▏     | 416/1000 [02:53<04:03,  2.40it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 416


 73%|███████▎  | 729/1000 [02:46<01:01,  4.38it/s]
  0%|          | 1/1000 [00:00<02:36,  6.38it/s]

Early quitting at epoch: 729


  1%|          | 10/1000 [00:01<02:43,  6.04it/s]
  0%|          | 2/1000 [00:00<01:34, 10.57it/s]

Early quitting at epoch: 10


  1%|          | 11/1000 [00:01<01:34, 10.48it/s]
  0%|          | 2/1000 [00:00<00:53, 18.65it/s]

Early quitting at epoch: 11


  2%|▏         | 17/1000 [00:01<00:58, 16.74it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 17


 22%|██▏       | 223/1000 [01:33<05:27,  2.38it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 223


 36%|███▌      | 362/1000 [01:21<02:24,  4.42it/s]
  0%|          | 1/1000 [00:00<02:03,  8.08it/s]

Early quitting at epoch: 362


  6%|▌         | 62/1000 [00:08<02:06,  7.44it/s]
  0%|          | 2/1000 [00:00<01:11, 13.91it/s]

Early quitting at epoch: 62


  2%|▏         | 15/1000 [00:01<01:25, 11.58it/s]
  0%|          | 2/1000 [00:00<01:00, 16.45it/s]

Early quitting at epoch: 15


  1%|▏         | 14/1000 [00:00<01:02, 15.80it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 14


 10%|▉         | 95/1000 [00:40<06:27,  2.34it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 95


 12%|█▏        | 122/1000 [00:27<03:21,  4.37it/s]
  0%|          | 1/1000 [00:00<01:59,  8.39it/s]

Early quitting at epoch: 122


  5%|▌         | 54/1000 [00:07<02:05,  7.57it/s]
  0%|          | 2/1000 [00:00<01:13, 13.49it/s]

Early quitting at epoch: 54


  3%|▎         | 29/1000 [00:02<01:18, 12.32it/s]
  0%|          | 2/1000 [00:00<00:52, 18.84it/s]

Early quitting at epoch: 29


  3%|▎         | 34/1000 [00:01<00:55, 17.55it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 34


  2%|▏         | 15/1000 [00:06<07:25,  2.21it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 15


  2%|▏         | 17/1000 [00:04<03:56,  4.15it/s]
  0%|          | 1/1000 [00:00<02:04,  8.02it/s]

Early quitting at epoch: 17


  2%|▏         | 19/1000 [00:02<02:16,  7.20it/s]
  0%|          | 1/1000 [00:00<02:51,  5.83it/s]

Early quitting at epoch: 19


  1%|▏         | 14/1000 [00:01<01:39,  9.90it/s]
  0%|          | 2/1000 [00:00<01:05, 15.25it/s]

Early quitting at epoch: 14


  1%|▏         | 14/1000 [00:00<01:01, 16.03it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 14


  1%|          | 10/1000 [00:04<07:32,  2.19it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:02<04:15,  3.88it/s]
  0%|          | 1/1000 [00:00<02:10,  7.64it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:26,  6.76it/s]
  0%|          | 2/1000 [00:00<01:19, 12.48it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<01:40,  9.89it/s]
  0%|          | 2/1000 [00:00<00:56, 17.69it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:00<01:04, 15.27it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 54%|█████▍    | 539/1000 [03:32<03:01,  2.54it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 539


 77%|███████▋  | 767/1000 [02:45<00:50,  4.63it/s]
  0%|          | 1/1000 [00:00<02:14,  7.41it/s]

Early quitting at epoch: 767


  1%|          | 11/1000 [00:01<02:28,  6.67it/s]
  0%|          | 2/1000 [00:00<01:16, 13.00it/s]

Early quitting at epoch: 11


  1%|          | 10/1000 [00:00<01:25, 11.55it/s]
  0%|          | 2/1000 [00:00<00:53, 18.54it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:00<01:01, 15.99it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 39%|███▉      | 392/1000 [02:34<03:59,  2.54it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 392


 37%|███▋      | 372/1000 [01:20<02:15,  4.65it/s]
  0%|          | 1/1000 [00:00<02:03,  8.10it/s]

Early quitting at epoch: 372


 13%|█▎        | 127/1000 [00:16<01:51,  7.85it/s]
  0%|          | 2/1000 [00:00<01:19, 12.52it/s]

Early quitting at epoch: 127


  6%|▋         | 65/1000 [00:05<01:13, 12.77it/s]
  0%|          | 2/1000 [00:00<01:29, 11.15it/s]

Early quitting at epoch: 65


  1%|          | 10/1000 [00:00<01:10, 14.03it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 11%|█         | 112/1000 [00:42<05:40,  2.61it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 112


 17%|█▋        | 168/1000 [00:36<03:01,  4.57it/s]
  0%|          | 1/1000 [00:00<02:16,  7.33it/s]

Early quitting at epoch: 168


  4%|▍         | 40/1000 [00:04<01:59,  8.06it/s]
  0%|          | 2/1000 [00:00<01:24, 11.79it/s]

Early quitting at epoch: 40


  4%|▍         | 44/1000 [00:03<01:14, 12.79it/s]
  0%|          | 2/1000 [00:00<00:57, 17.39it/s]

Early quitting at epoch: 44


  2%|▏         | 20/1000 [00:01<00:59, 16.36it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 20


  2%|▏         | 18/1000 [00:07<06:33,  2.50it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 18


  2%|▏         | 24/1000 [00:05<03:36,  4.50it/s]
  0%|          | 1/1000 [00:00<01:45,  9.51it/s]

Early quitting at epoch: 24


  3%|▎         | 28/1000 [00:03<02:03,  7.88it/s]
  0%|          | 2/1000 [00:00<01:20, 12.41it/s]

Early quitting at epoch: 28


  2%|▏         | 17/1000 [00:01<01:26, 11.38it/s]
  0%|          | 2/1000 [00:00<00:53, 18.67it/s]

Early quitting at epoch: 17


  2%|▏         | 22/1000 [00:01<00:56, 17.17it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 22


  1%|          | 10/1000 [00:04<07:01,  2.35it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:02<03:52,  4.26it/s]
  0%|          | 1/1000 [00:00<02:01,  8.20it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:19,  7.11it/s]
  0%|          | 2/1000 [00:00<01:05, 15.17it/s]

Early quitting at epoch: 10


  1%|          | 11/1000 [00:00<01:21, 12.09it/s]
  0%|          | 2/1000 [00:00<00:59, 16.83it/s]

Early quitting at epoch: 11


  1%|          | 10/1000 [00:00<01:02, 15.72it/s]

Early quitting at epoch: 10





In [80]:
# Save all trained models held by `trainer_text`.
# The destination is stored in `save_dir` instead of `dir` so the builtin
# `dir()` is not shadowed in the notebook's global namespace.
save_dir = f"{models_dir}/{dataset_method}"
# to_be_saved_models=None is forwarded unchanged; presumably it means
# "no filter, save everything" -- TODO confirm in Trainer.save_trained_models.
trainer_text.save_trained_models(dir=save_dir, to_be_saved_models=None)

## 2.2 Hyperparam Search on Concat Embeddings

In [81]:
# Model class handed to the trainer
model = VanillaNN

# Feature-combination method for this section, and its entry in the
# method -> dataset lookup built earlier in the notebook
dataset_method = "concat"
dataset_dict = method_to_split_to_dataset[dataset_method]

# Dedicated trainer for the "concat" method: model class + method name + datasets
trainer_concat = Trainer(model, dataset_method, dataset_dict)

In [82]:
# Run one hyperparameter search per model-initialisation config, each over
# the shared learning-rate / batch-size grids and epoch budget.
for model_config in model_init_param_configs:
    trainer_concat.hyperparameter_search(
        model_init_params=model_config,
        device=device,
        learning_rates=learning_rates,
        batch_sizes=batch_sizes,
        num_epochs=num_epochs,
    )

 76%|███████▌  | 759/1000 [17:09<05:26,  1.36s/it]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 759


100%|██████████| 1000/1000 [11:06<00:00,  1.50it/s]
  1%|          | 12/1000 [00:04<06:17,  2.62it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 12


  1%|          | 11/1000 [00:02<03:31,  4.68it/s]
  0%|          | 1/1000 [00:00<01:57,  8.54it/s]

Early quitting at epoch: 11


  1%|          | 10/1000 [00:01<02:32,  6.51it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 26%|██▌       | 261/1000 [05:50<16:31,  1.34s/it]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 261


 42%|████▏     | 421/1000 [04:42<06:27,  1.49it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 421


  1%|▏         | 13/1000 [00:04<06:15,  2.63it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 13


  2%|▏         | 15/1000 [00:03<03:45,  4.36it/s]
  0%|          | 1/1000 [00:00<02:15,  7.38it/s]

Early quitting at epoch: 15


  1%|          | 12/1000 [00:01<02:28,  6.65it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 12


  3%|▎         | 33/1000 [00:44<21:55,  1.36s/it]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 33


  4%|▍         | 42/1000 [00:28<10:57,  1.46it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 42


  4%|▍         | 39/1000 [00:14<05:53,  2.72it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 39


  5%|▌         | 50/1000 [00:10<03:26,  4.61it/s]
  0%|          | 1/1000 [00:00<02:21,  7.04it/s]

Early quitting at epoch: 50


  1%|          | 10/1000 [00:01<02:48,  5.88it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:15<24:50,  1.51s/it]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:07<11:50,  1.39it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:04<06:38,  2.48it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  2%|▏         | 15/1000 [00:03<03:53,  4.23it/s]
  0%|          | 1/1000 [00:00<02:28,  6.74it/s]

Early quitting at epoch: 15


  2%|▏         | 17/1000 [00:02<02:38,  6.20it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 17


  1%|          | 10/1000 [00:14<24:34,  1.49s/it]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:07<12:23,  1.33it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:04<06:36,  2.49it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:02<03:52,  4.27it/s]
  0%|          | 1/1000 [00:00<02:06,  7.91it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:22,  6.96it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 95%|█████████▌| 954/1000 [19:49<00:57,  1.25s/it]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 954


100%|██████████| 1000/1000 [10:20<00:00,  1.61it/s]
  1%|▏         | 13/1000 [00:04<05:36,  2.93it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 13


  1%|▏         | 14/1000 [00:03<03:44,  4.38it/s]
  0%|          | 1/1000 [00:00<01:55,  8.66it/s]

Early quitting at epoch: 14


  1%|          | 10/1000 [00:01<02:13,  7.43it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 21%|██        | 208/1000 [04:20<16:31,  1.25s/it]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 208


 30%|███       | 300/1000 [03:06<07:14,  1.61it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 300


 11%|█▏        | 113/1000 [00:38<05:02,  2.93it/s]
  0%|          | 1/1000 [00:00<03:06,  5.37it/s]

Early quitting at epoch: 113


  1%|          | 11/1000 [00:02<03:27,  4.77it/s]
  0%|          | 1/1000 [00:00<02:25,  6.84it/s]

Early quitting at epoch: 11


  1%|          | 11/1000 [00:01<02:42,  6.07it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 11


  2%|▏         | 23/1000 [00:30<21:34,  1.32s/it]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 23


  3%|▎         | 32/1000 [00:20<10:21,  1.56it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 32


  3%|▎         | 32/1000 [00:11<05:38,  2.86it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 32


  4%|▎         | 36/1000 [00:07<03:23,  4.73it/s]
  0%|          | 1/1000 [00:00<02:10,  7.64it/s]

Early quitting at epoch: 36


  5%|▌         | 51/1000 [00:06<02:06,  7.49it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 51


  1%|          | 10/1000 [00:14<23:24,  1.42s/it]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:06<11:11,  1.47it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:03<06:24,  2.58it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 12/1000 [00:02<03:43,  4.41it/s]
  0%|          | 1/1000 [00:00<02:13,  7.48it/s]

Early quitting at epoch: 12


  2%|▏         | 16/1000 [00:02<02:23,  6.84it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 16


  1%|          | 10/1000 [00:13<22:43,  1.38s/it]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:07<12:03,  1.37it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:03<06:01,  2.74it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:02<03:29,  4.73it/s]
  0%|          | 1/1000 [00:00<02:19,  7.16it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:32,  6.47it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


100%|██████████| 1000/1000 [13:35<00:00,  1.23it/s]
100%|██████████| 1000/1000 [07:02<00:00,  2.37it/s]
  1%|          | 10/1000 [00:02<04:45,  3.46it/s]
  0%|          | 1/1000 [00:00<02:26,  6.84it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:54,  5.68it/s]
  0%|          | 1/1000 [00:00<01:50,  9.06it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:04,  7.98it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 21%|██▏       | 214/1000 [02:54<10:40,  1.23it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 214


 31%|███       | 307/1000 [02:16<05:08,  2.24it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 307


 11%|█         | 108/1000 [00:27<03:43,  4.00it/s]
  0%|          | 1/1000 [00:00<02:33,  6.51it/s]

Early quitting at epoch: 108


 12%|█▎        | 125/1000 [00:19<02:13,  6.55it/s]
  0%|          | 1/1000 [00:00<01:44,  9.58it/s]

Early quitting at epoch: 125


  3%|▎         | 29/1000 [00:03<01:45,  9.22it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 29


  3%|▎         | 29/1000 [00:24<13:28,  1.20it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 29


  4%|▎         | 37/1000 [00:16<07:10,  2.24it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 37


  4%|▎         | 36/1000 [00:09<04:17,  3.74it/s]
  0%|          | 1/1000 [00:00<02:17,  7.24it/s]

Early quitting at epoch: 36


  4%|▍         | 43/1000 [00:06<02:30,  6.34it/s]
  0%|          | 2/1000 [00:00<01:34, 10.60it/s]

Early quitting at epoch: 43


  3%|▎         | 31/1000 [00:03<01:43,  9.35it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 31


  1%|          | 10/1000 [00:09<15:25,  1.07it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:04<08:06,  2.03it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:02<04:19,  3.82it/s]
  0%|          | 1/1000 [00:00<02:21,  7.04it/s]

Early quitting at epoch: 10


  1%|          | 12/1000 [00:01<02:42,  6.08it/s]
  0%|          | 1/1000 [00:00<01:41,  9.83it/s]

Early quitting at epoch: 12


  2%|▏         | 18/1000 [00:02<01:51,  8.81it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 18


  1%|          | 10/1000 [00:09<14:53,  1.11it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:04<07:48,  2.11it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:02<04:20,  3.80it/s]
  0%|          | 1/1000 [00:00<01:58,  8.41it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:33,  6.44it/s]
  0%|          | 2/1000 [00:00<01:33, 10.62it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<01:46,  9.32it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 63%|██████▎   | 630/1000 [11:53<06:58,  1.13s/it]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 630


 89%|████████▉ | 888/1000 [08:22<01:03,  1.77it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 888


 17%|█▋        | 172/1000 [00:54<04:23,  3.14it/s]
  0%|          | 1/1000 [00:00<02:52,  5.80it/s]

Early quitting at epoch: 172


  1%|          | 10/1000 [00:02<03:20,  4.95it/s]
  0%|          | 1/1000 [00:00<02:18,  7.19it/s]

Early quitting at epoch: 10


  1%|          | 11/1000 [00:01<02:18,  7.14it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 11


 17%|█▋        | 172/1000 [03:14<15:38,  1.13s/it]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 172


 27%|██▋       | 266/1000 [02:33<07:02,  1.74it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 266


 13%|█▎        | 128/1000 [00:41<04:40,  3.11it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 128


  1%|▏         | 14/1000 [00:02<03:10,  5.17it/s]
  0%|          | 1/1000 [00:00<01:52,  8.85it/s]

Early quitting at epoch: 14


  1%|          | 10/1000 [00:01<02:07,  7.79it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  2%|▏         | 23/1000 [00:27<19:14,  1.18s/it]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 23


  3%|▎         | 32/1000 [00:18<09:25,  1.71it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 32


  4%|▍         | 41/1000 [00:13<05:13,  3.06it/s]
  0%|          | 1/1000 [00:00<02:56,  5.67it/s]

Early quitting at epoch: 41


  3%|▎         | 29/1000 [00:05<03:10,  5.09it/s]
  0%|          | 1/1000 [00:00<02:06,  7.88it/s]

Early quitting at epoch: 29


  4%|▍         | 44/1000 [00:05<02:00,  7.93it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 44


  1%|          | 10/1000 [00:12<21:06,  1.28s/it]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:06<10:12,  1.62it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:03<06:08,  2.69it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:02<03:34,  4.62it/s]
  0%|          | 1/1000 [00:00<02:04,  8.04it/s]

Early quitting at epoch: 10


  2%|▏         | 21/1000 [00:02<02:13,  7.35it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 21


  1%|          | 10/1000 [00:12<20:27,  1.24s/it]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:06<10:58,  1.50it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:03<05:27,  3.02it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<03:13,  5.11it/s]
  0%|          | 1/1000 [00:00<01:54,  8.75it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:07,  7.74it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 90%|████████▉ | 896/1000 [09:48<01:08,  1.52it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 896


100%|██████████| 1000/1000 [06:13<00:00,  2.68it/s]
  1%|          | 11/1000 [00:02<03:59,  4.14it/s]
  0%|          | 1/1000 [00:00<02:02,  8.15it/s]

Early quitting at epoch: 11


  1%|          | 12/1000 [00:01<02:19,  7.11it/s]
  0%|          | 2/1000 [00:00<01:28, 11.26it/s]

Early quitting at epoch: 12


  1%|          | 10/1000 [00:00<01:37, 10.20it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 22%|██▏       | 223/1000 [02:37<09:08,  1.42it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 223


 35%|███▍      | 347/1000 [02:11<04:07,  2.64it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 347


 18%|█▊        | 181/1000 [00:40<03:01,  4.51it/s]
  0%|          | 1/1000 [00:00<01:59,  8.34it/s]

Early quitting at epoch: 181


  1%|          | 12/1000 [00:01<02:14,  7.34it/s]
  0%|          | 2/1000 [00:00<01:28, 11.27it/s]

Early quitting at epoch: 12


  2%|▏         | 18/1000 [00:01<01:35, 10.30it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 18


  4%|▍         | 38/1000 [00:26<11:12,  1.43it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 38


  5%|▌         | 53/1000 [00:19<05:50,  2.70it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 53


  6%|▌         | 57/1000 [00:12<03:22,  4.66it/s]
  0%|          | 1/1000 [00:00<02:00,  8.29it/s]

Early quitting at epoch: 57


  4%|▍         | 40/1000 [00:05<02:11,  7.29it/s]
  0%|          | 2/1000 [00:00<01:29, 11.13it/s]

Early quitting at epoch: 40


  2%|▏         | 16/1000 [00:01<01:36, 10.23it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 16


  1%|          | 10/1000 [00:06<11:26,  1.44it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:03<06:30,  2.53it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 11/1000 [00:02<03:48,  4.33it/s]
  0%|          | 1/1000 [00:00<02:27,  6.77it/s]

Early quitting at epoch: 11


  2%|▏         | 15/1000 [00:02<02:17,  7.15it/s]
  0%|          | 2/1000 [00:00<01:25, 11.64it/s]

Early quitting at epoch: 15


  1%|          | 12/1000 [00:01<01:42,  9.59it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 12


  1%|          | 10/1000 [00:07<12:26,  1.33it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:04<06:42,  2.46it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:02<04:00,  4.11it/s]
  0%|          | 1/1000 [00:00<02:12,  7.53it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:21,  7.01it/s]
  0%|          | 2/1000 [00:00<01:29, 11.17it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:00<01:36, 10.27it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


100%|██████████| 1000/1000 [09:31<00:00,  1.75it/s]
100%|██████████| 1000/1000 [05:12<00:00,  3.20it/s]
  1%|          | 10/1000 [00:02<03:19,  4.96it/s]
  0%|          | 1/1000 [00:00<01:51,  8.97it/s]

Early quitting at epoch: 10


  1%|          | 11/1000 [00:01<02:14,  7.35it/s]
  0%|          | 2/1000 [00:00<01:12, 13.79it/s]

Early quitting at epoch: 11


  2%|▏         | 15/1000 [00:01<01:16, 12.80it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 15


 27%|██▋       | 273/1000 [02:33<06:49,  1.78it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 273


 47%|████▋     | 469/1000 [02:24<02:43,  3.26it/s]
  0%|          | 1/1000 [00:00<02:45,  6.02it/s]

Early quitting at epoch: 469


  1%|          | 12/1000 [00:02<03:07,  5.26it/s]
  0%|          | 1/1000 [00:00<01:46,  9.40it/s]

Early quitting at epoch: 12


  1%|▏         | 13/1000 [00:01<02:10,  7.56it/s]
  0%|          | 2/1000 [00:00<01:24, 11.85it/s]

Early quitting at epoch: 13


  2%|▏         | 15/1000 [00:01<01:21, 12.10it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 15


  4%|▍         | 41/1000 [00:23<09:14,  1.73it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 41


  8%|▊         | 75/1000 [00:24<05:00,  3.08it/s]
  0%|          | 1/1000 [00:00<02:56,  5.66it/s]

Early quitting at epoch: 75


  5%|▌         | 51/1000 [00:09<02:53,  5.47it/s]
  0%|          | 1/1000 [00:00<02:12,  7.56it/s]

Early quitting at epoch: 51


  5%|▍         | 46/1000 [00:05<01:49,  8.72it/s]
  0%|          | 2/1000 [00:00<01:20, 12.35it/s]

Early quitting at epoch: 46


  4%|▍         | 38/1000 [00:03<01:22, 11.59it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 38


  1%|          | 10/1000 [00:06<10:46,  1.53it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 12/1000 [00:04<05:41,  2.90it/s]
  0%|          | 1/1000 [00:00<02:47,  5.98it/s]

Early quitting at epoch: 12


  1%|▏         | 14/1000 [00:02<03:19,  4.94it/s]
  0%|          | 1/1000 [00:00<01:55,  8.66it/s]

Early quitting at epoch: 14


  2%|▏         | 17/1000 [00:02<01:55,  8.48it/s]
  0%|          | 2/1000 [00:00<01:15, 13.22it/s]

Early quitting at epoch: 17


  2%|▏         | 16/1000 [00:01<01:21, 12.02it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 16


  1%|          | 10/1000 [00:06<10:54,  1.51it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:03<06:00,  2.74it/s]
  0%|          | 1/1000 [00:00<02:45,  6.02it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<03:08,  5.26it/s]
  0%|          | 1/1000 [00:00<01:48,  9.22it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<01:55,  8.57it/s]
  0%|          | 2/1000 [00:00<01:06, 14.92it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:00<01:17, 12.85it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 43%|████▎     | 433/1000 [04:02<05:17,  1.79it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 433


 77%|███████▋  | 768/1000 [03:58<01:12,  3.22it/s]
  0%|          | 1/1000 [00:00<02:47,  5.95it/s]

Early quitting at epoch: 768


  1%|▏         | 14/1000 [00:02<03:04,  5.34it/s]
  0%|          | 1/1000 [00:00<01:55,  8.65it/s]

Early quitting at epoch: 14


  1%|          | 11/1000 [00:01<01:57,  8.45it/s]
  0%|          | 2/1000 [00:00<01:23, 12.00it/s]

Early quitting at epoch: 11


  1%|          | 11/1000 [00:00<01:26, 11.45it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 11


 21%|██▏       | 213/1000 [01:58<07:19,  1.79it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 213


 22%|██▏       | 217/1000 [01:07<04:02,  3.23it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 217


 10%|▉         | 99/1000 [00:18<02:50,  5.28it/s]
  0%|          | 1/1000 [00:00<01:47,  9.26it/s]

Early quitting at epoch: 99


  3%|▎         | 29/1000 [00:03<01:48,  8.92it/s]
  0%|          | 2/1000 [00:00<01:23, 11.94it/s]

Early quitting at epoch: 29


  2%|▏         | 20/1000 [00:01<01:34, 10.34it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 20


  4%|▍         | 42/1000 [00:24<09:08,  1.75it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 42


  6%|▌         | 55/1000 [00:17<04:58,  3.16it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 55


  4%|▍         | 40/1000 [00:07<03:05,  5.17it/s]
  0%|          | 1/1000 [00:00<01:44,  9.54it/s]

Early quitting at epoch: 40


  4%|▎         | 36/1000 [00:04<01:50,  8.72it/s]
  0%|          | 1/1000 [00:00<01:42,  9.71it/s]

Early quitting at epoch: 36


  2%|▏         | 23/1000 [00:02<01:28, 11.10it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 23


  1%|          | 10/1000 [00:06<10:11,  1.62it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:03<05:53,  2.80it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|▏         | 13/1000 [00:02<03:27,  4.77it/s]
  0%|          | 1/1000 [00:00<01:54,  8.69it/s]

Early quitting at epoch: 13


  1%|          | 12/1000 [00:01<02:00,  8.17it/s]
  0%|          | 2/1000 [00:00<01:28, 11.29it/s]

Early quitting at epoch: 12


  2%|▏         | 17/1000 [00:01<01:24, 11.60it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 17


  1%|          | 10/1000 [00:06<10:07,  1.63it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:03<05:40,  2.91it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:02<03:32,  4.65it/s]
  0%|          | 1/1000 [00:00<01:58,  8.42it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:12,  7.48it/s]
  0%|          | 2/1000 [00:00<01:26, 11.57it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:00<01:34, 10.45it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 34%|███▍      | 342/1000 [02:42<05:12,  2.11it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 342


 96%|█████████▋| 965/1000 [04:13<00:09,  3.80it/s]
  0%|          | 1/1000 [00:00<02:27,  6.79it/s]

Early quitting at epoch: 965


  2%|▏         | 16/1000 [00:02<02:34,  6.39it/s]
  0%|          | 2/1000 [00:00<01:32, 10.84it/s]

Early quitting at epoch: 16


  1%|          | 11/1000 [00:01<01:53,  8.70it/s]
  0%|          | 2/1000 [00:00<01:10, 14.19it/s]

Early quitting at epoch: 11


  1%|          | 12/1000 [00:01<01:22, 11.93it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 12


 26%|██▋       | 263/1000 [02:05<05:50,  2.10it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 263


 36%|███▌      | 358/1000 [01:33<02:47,  3.83it/s]
  0%|          | 1/1000 [00:00<02:27,  6.75it/s]

Early quitting at epoch: 358


  7%|▋         | 68/1000 [00:11<02:33,  6.06it/s]
  0%|          | 2/1000 [00:00<01:33, 10.68it/s]

Early quitting at epoch: 68


  3%|▎         | 34/1000 [00:03<01:35, 10.14it/s]
  0%|          | 2/1000 [00:00<01:04, 15.59it/s]

Early quitting at epoch: 34


  1%|▏         | 13/1000 [00:00<01:12, 13.53it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 13


  5%|▌         | 50/1000 [00:24<07:36,  2.08it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 50


  8%|▊         | 79/1000 [00:20<04:03,  3.78it/s]
  0%|          | 1/1000 [00:00<02:17,  7.25it/s]

Early quitting at epoch: 79


  4%|▍         | 43/1000 [00:06<02:31,  6.32it/s]
  0%|          | 1/1000 [00:00<01:51,  8.99it/s]

Early quitting at epoch: 43


  4%|▍         | 38/1000 [00:03<01:41,  9.52it/s]
  0%|          | 2/1000 [00:00<01:05, 15.22it/s]

Early quitting at epoch: 38


  2%|▏         | 21/1000 [00:01<01:09, 14.06it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 21


  1%|          | 10/1000 [00:05<08:15,  2.00it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|▏         | 13/1000 [00:03<04:27,  3.69it/s]
  0%|          | 1/1000 [00:00<02:48,  5.94it/s]

Early quitting at epoch: 13


  1%|▏         | 13/1000 [00:02<02:38,  6.23it/s]
  0%|          | 1/1000 [00:00<01:49,  9.09it/s]

Early quitting at epoch: 13


  1%|▏         | 14/1000 [00:01<01:49,  9.02it/s]
  0%|          | 2/1000 [00:00<01:12, 13.79it/s]

Early quitting at epoch: 14


  2%|▏         | 18/1000 [00:01<01:18, 12.52it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 18


  1%|          | 10/1000 [00:05<08:42,  1.89it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:02<04:28,  3.69it/s]
  0%|          | 1/1000 [00:00<02:24,  6.92it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:46,  5.94it/s]
  0%|          | 1/1000 [00:00<01:53,  8.80it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<01:57,  8.45it/s]
  0%|          | 2/1000 [00:00<01:14, 13.48it/s]

Early quitting at epoch: 10


  1%|          | 11/1000 [00:01<01:30, 10.98it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 11


 41%|████      | 407/1000 [02:48<04:06,  2.41it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 407


 63%|██████▎   | 629/1000 [02:26<01:26,  4.31it/s]
  0%|          | 1/1000 [00:00<02:20,  7.12it/s]

Early quitting at epoch: 629


  1%|          | 11/1000 [00:01<02:24,  6.86it/s]
  0%|          | 2/1000 [00:00<01:23, 11.95it/s]

Early quitting at epoch: 11


  1%|          | 12/1000 [00:01<01:37, 10.13it/s]
  0%|          | 2/1000 [00:00<01:04, 15.47it/s]

Early quitting at epoch: 12


  1%|▏         | 14/1000 [00:00<01:07, 14.65it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 14


 31%|███       | 307/1000 [02:07<04:47,  2.41it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 307


 47%|████▋     | 467/1000 [01:47<02:03,  4.33it/s]
  0%|          | 1/1000 [00:00<02:14,  7.44it/s]

Early quitting at epoch: 467


  7%|▋         | 73/1000 [00:10<02:07,  7.24it/s]
  0%|          | 2/1000 [00:00<01:24, 11.81it/s]

Early quitting at epoch: 73


  2%|▏         | 18/1000 [00:01<01:29, 11.00it/s]
  0%|          | 2/1000 [00:00<01:08, 14.58it/s]

Early quitting at epoch: 18


  1%|          | 11/1000 [00:00<01:15, 13.04it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 11


  7%|▋         | 67/1000 [00:28<06:32,  2.37it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 67


  9%|▉         | 90/1000 [00:20<03:31,  4.30it/s]
  0%|          | 1/1000 [00:00<02:08,  7.77it/s]

Early quitting at epoch: 90


  4%|▍         | 41/1000 [00:05<02:16,  7.03it/s]
  0%|          | 2/1000 [00:00<01:20, 12.34it/s]

Early quitting at epoch: 41


  4%|▎         | 37/1000 [00:03<01:22, 11.64it/s]
  0%|          | 2/1000 [00:00<00:59, 16.90it/s]

Early quitting at epoch: 37


  3%|▎         | 29/1000 [00:01<01:04, 15.05it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 29


  1%|          | 12/1000 [00:05<07:17,  2.26it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 12


  2%|▏         | 15/1000 [00:03<04:00,  4.09it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 15


  2%|▏         | 21/1000 [00:03<02:28,  6.58it/s]
  0%|          | 2/1000 [00:00<01:16, 13.11it/s]

Early quitting at epoch: 21


  2%|▏         | 17/1000 [00:01<01:25, 11.52it/s]
  0%|          | 2/1000 [00:00<00:57, 17.21it/s]

Early quitting at epoch: 17


  2%|▏         | 19/1000 [00:01<01:00, 16.20it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 19


  1%|          | 10/1000 [00:04<07:11,  2.30it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:02<04:28,  3.69it/s]
  0%|          | 1/1000 [00:00<02:12,  7.55it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:34,  6.39it/s]
  0%|          | 2/1000 [00:00<01:20, 12.42it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:00<01:30, 10.93it/s]
  0%|          | 2/1000 [00:00<01:04, 15.42it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:00<01:13, 13.55it/s]

Early quitting at epoch: 10





In [83]:
# Save all trained models held by `trainer_concat`.
# The destination is stored in `save_dir` instead of `dir` so the builtin
# `dir()` is not shadowed in the notebook's global namespace.
save_dir = f"{models_dir}/{dataset_method}"
# to_be_saved_models=None is forwarded unchanged; presumably it means
# "no filter, save everything" -- TODO confirm in Trainer.save_trained_models.
trainer_concat.save_trained_models(dir=save_dir, to_be_saved_models=None)

## 2.3 Hyperparam Search on Mean Embeddings

In [84]:
# Model class handed to the trainer
model = VanillaNN

# Feature-combination method for this section, and its entry in the
# method -> dataset lookup built earlier in the notebook
dataset_method = "mean"
dataset_dict = method_to_split_to_dataset[dataset_method]

# Dedicated trainer for the "mean" method: model class + method name + datasets
trainer_mean = Trainer(model, dataset_method, dataset_dict)

In [85]:
# Run one hyperparameter search per model-initialisation config, each over
# the shared learning-rate / batch-size grids and epoch budget.
for model_config in model_init_param_configs:
    trainer_mean.hyperparameter_search(
        model_init_params=model_config,
        device=device,
        learning_rates=learning_rates,
        batch_sizes=batch_sizes,
        num_epochs=num_epochs,
    )

  3%|▎         | 26/1000 [00:26<16:50,  1.04s/it]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 26


  1%|▏         | 13/1000 [00:07<09:09,  1.80it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 13


  1%|          | 10/1000 [00:03<05:02,  3.27it/s]
  0%|          | 1/1000 [00:00<02:17,  7.29it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:46,  5.94it/s]
  0%|          | 1/1000 [00:00<02:16,  7.30it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:04,  7.94it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 28%|██▊       | 275/1000 [04:12<11:06,  1.09it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 275


 39%|███▊      | 387/1000 [02:59<04:44,  2.15it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 387


  2%|▏         | 23/1000 [00:06<04:24,  3.69it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 23


  2%|▏         | 18/1000 [00:02<02:42,  6.03it/s]
  0%|          | 1/1000 [00:00<01:43,  9.69it/s]

Early quitting at epoch: 18


  1%|▏         | 13/1000 [00:01<01:42,  9.67it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 13


  3%|▎         | 32/1000 [00:28<14:32,  1.11it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 32


  5%|▍         | 47/1000 [00:22<07:26,  2.13it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 47


  5%|▌         | 51/1000 [00:13<04:18,  3.67it/s]
  0%|          | 1/1000 [00:00<02:28,  6.71it/s]

Early quitting at epoch: 51


  6%|▌         | 58/1000 [00:08<02:25,  6.47it/s]
  0%|          | 1/1000 [00:00<01:44,  9.60it/s]

Early quitting at epoch: 58


  1%|          | 12/1000 [00:01<02:01,  8.10it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 12


  1%|          | 10/1000 [00:09<15:56,  1.04it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:04<08:02,  2.05it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|▏         | 13/1000 [00:03<04:41,  3.51it/s]
  0%|          | 1/1000 [00:00<02:49,  5.88it/s]

Early quitting at epoch: 13


  2%|▏         | 15/1000 [00:02<02:57,  5.55it/s]
  0%|          | 1/1000 [00:00<01:46,  9.39it/s]

Early quitting at epoch: 15


  2%|▏         | 16/1000 [00:01<01:47,  9.16it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 16


  1%|          | 10/1000 [00:09<16:12,  1.02it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:04<07:59,  2.07it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:03<04:59,  3.31it/s]
  0%|          | 1/1000 [00:00<02:31,  6.58it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:46,  5.94it/s]
  0%|          | 1/1000 [00:00<01:58,  8.44it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<01:42,  9.67it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 80%|████████  | 805/1000 [10:24<02:31,  1.29it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 805


  6%|▌         | 61/1000 [00:25<06:34,  2.38it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 61


  1%|          | 10/1000 [00:02<04:21,  3.78it/s]
  0%|          | 1/1000 [00:00<02:23,  6.98it/s]

Early quitting at epoch: 10


  2%|▏         | 16/1000 [00:02<02:24,  6.82it/s]
  0%|          | 2/1000 [00:00<01:28, 11.25it/s]

Early quitting at epoch: 16


  1%|▏         | 14/1000 [00:01<01:38, 10.05it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 14


 25%|██▌       | 252/1000 [03:16<09:44,  1.28it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 252


 39%|███▊      | 387/1000 [02:40<04:14,  2.40it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 387


  7%|▋         | 72/1000 [00:17<03:41,  4.18it/s]
  0%|          | 1/1000 [00:00<02:28,  6.73it/s]

Early quitting at epoch: 72


  6%|▌         | 62/1000 [00:09<02:17,  6.80it/s]
  0%|          | 2/1000 [00:00<01:29, 11.19it/s]

Early quitting at epoch: 62


  1%|          | 10/1000 [00:00<01:36, 10.22it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  3%|▎         | 31/1000 [00:24<12:48,  1.26it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 31


  4%|▍         | 42/1000 [00:17<06:45,  2.36it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 42


  4%|▍         | 40/1000 [00:09<03:54,  4.10it/s]
  0%|          | 1/1000 [00:00<02:22,  7.00it/s]

Early quitting at epoch: 40


  4%|▍         | 40/1000 [00:06<02:25,  6.62it/s]
  0%|          | 2/1000 [00:00<01:29, 11.20it/s]

Early quitting at epoch: 40


  5%|▍         | 46/1000 [00:04<01:27, 10.90it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 46


  1%|          | 10/1000 [00:08<14:44,  1.12it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:04<07:41,  2.15it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:02<04:19,  3.82it/s]
  0%|          | 1/1000 [00:00<02:01,  8.21it/s]

Early quitting at epoch: 10


  1%|▏         | 14/1000 [00:01<02:15,  7.30it/s]
  0%|          | 2/1000 [00:00<01:25, 11.69it/s]

Early quitting at epoch: 14


  2%|▏         | 16/1000 [00:01<01:28, 11.13it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 16


  1%|          | 10/1000 [00:08<14:45,  1.12it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:04<07:31,  2.19it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:02<04:33,  3.62it/s]
  0%|          | 1/1000 [00:00<02:22,  7.03it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:26,  6.76it/s]
  0%|          | 2/1000 [00:00<01:30, 11.03it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:00<01:36, 10.25it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 78%|███████▊  | 779/1000 [08:55<02:32,  1.45it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 779


100%|██████████| 1000/1000 [06:06<00:00,  2.73it/s]
  1%|          | 10/1000 [00:02<03:47,  4.35it/s]
  0%|          | 1/1000 [00:00<02:05,  7.96it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:19,  7.08it/s]
  0%|          | 2/1000 [00:00<01:22, 12.09it/s]

Early quitting at epoch: 10


  1%|          | 11/1000 [00:00<01:26, 11.40it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 11


 26%|██▌       | 260/1000 [02:59<08:31,  1.45it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 260


 38%|███▊      | 379/1000 [02:19<03:48,  2.72it/s]
  0%|          | 1/1000 [00:00<03:06,  5.37it/s]

Early quitting at epoch: 379


 13%|█▎        | 129/1000 [00:27<03:03,  4.76it/s]
  0%|          | 1/1000 [00:00<01:57,  8.53it/s]

Early quitting at epoch: 129


  1%|          | 10/1000 [00:01<02:12,  7.46it/s]
  0%|          | 2/1000 [00:00<01:21, 12.22it/s]

Early quitting at epoch: 10


  1%|          | 11/1000 [00:00<01:25, 11.57it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 11


  3%|▎         | 32/1000 [00:22<11:27,  1.41it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 32


  5%|▍         | 47/1000 [00:17<05:55,  2.68it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 47


  6%|▌         | 56/1000 [00:12<03:23,  4.63it/s]
  0%|          | 1/1000 [00:00<01:53,  8.80it/s]

Early quitting at epoch: 56


  5%|▌         | 50/1000 [00:06<02:01,  7.81it/s]
  0%|          | 2/1000 [00:00<01:20, 12.39it/s]

Early quitting at epoch: 50


  4%|▍         | 41/1000 [00:03<01:19, 12.12it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 41


  1%|          | 10/1000 [00:07<13:00,  1.27it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:03<06:11,  2.67it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 12/1000 [00:02<03:49,  4.30it/s]
  0%|          | 1/1000 [00:00<02:03,  8.10it/s]

Early quitting at epoch: 12


  2%|▏         | 15/1000 [00:01<02:04,  7.89it/s]
  0%|          | 2/1000 [00:00<01:12, 13.82it/s]

Early quitting at epoch: 15


  2%|▏         | 15/1000 [00:01<01:28, 11.18it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 15


  1%|          | 10/1000 [00:07<12:15,  1.35it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:03<06:18,  2.61it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:02<03:42,  4.46it/s]
  0%|          | 1/1000 [00:00<01:57,  8.52it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:30,  6.57it/s]
  0%|          | 2/1000 [00:00<01:17, 12.85it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:00<01:37, 10.17it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 68%|██████▊   | 678/1000 [07:36<03:36,  1.49it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 678


100%|██████████| 1000/1000 [06:01<00:00,  2.77it/s]
  1%|          | 11/1000 [00:02<03:50,  4.29it/s]
  0%|          | 1/1000 [00:00<02:15,  7.35it/s]

Early quitting at epoch: 11


  1%|          | 11/1000 [00:01<02:34,  6.40it/s]
  0%|          | 2/1000 [00:00<01:25, 11.70it/s]

Early quitting at epoch: 11


  1%|          | 10/1000 [00:00<01:24, 11.65it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 23%|██▎       | 232/1000 [02:36<08:36,  1.49it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 232


 32%|███▎      | 325/1000 [01:57<04:04,  2.76it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 325


 10%|▉         | 96/1000 [00:20<03:09,  4.78it/s]
  0%|          | 1/1000 [00:00<02:10,  7.67it/s]

Early quitting at epoch: 96


  5%|▌         | 54/1000 [00:07<02:03,  7.68it/s]
  0%|          | 1/1000 [00:00<01:40,  9.94it/s]

Early quitting at epoch: 54


  2%|▏         | 20/1000 [00:01<01:33, 10.48it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 20


  3%|▎         | 30/1000 [00:20<11:06,  1.46it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 30


  4%|▍         | 44/1000 [00:16<06:02,  2.64it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 44


  5%|▌         | 54/1000 [00:11<03:23,  4.64it/s]
  0%|          | 1/1000 [00:00<02:25,  6.84it/s]

Early quitting at epoch: 54


  4%|▍         | 42/1000 [00:05<02:04,  7.66it/s]
  0%|          | 2/1000 [00:00<01:23, 11.98it/s]

Early quitting at epoch: 42


  2%|▏         | 23/1000 [00:02<01:25, 11.48it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 23


  1%|          | 10/1000 [00:07<12:25,  1.33it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:04<06:54,  2.39it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 11/1000 [00:02<03:52,  4.26it/s]
  0%|          | 1/1000 [00:00<02:01,  8.24it/s]

Early quitting at epoch: 11


  1%|▏         | 14/1000 [00:01<02:10,  7.58it/s]
  0%|          | 2/1000 [00:00<01:22, 12.10it/s]

Early quitting at epoch: 14


  1%|          | 12/1000 [00:01<01:31, 10.76it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 12


  1%|          | 10/1000 [00:07<11:48,  1.40it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:03<06:29,  2.54it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:02<03:56,  4.19it/s]
  0%|          | 1/1000 [00:00<02:38,  6.30it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:32,  6.49it/s]
  0%|          | 2/1000 [00:00<01:21, 12.19it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:00<01:28, 11.15it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 76%|███████▋  | 764/1000 [07:19<02:15,  1.74it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 764


100%|██████████| 1000/1000 [05:09<00:00,  3.23it/s]
  1%|          | 10/1000 [00:01<03:05,  5.34it/s]
  0%|          | 1/1000 [00:00<01:41,  9.88it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<01:48,  9.10it/s]
  0%|          | 2/1000 [00:00<01:09, 14.40it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:00<01:26, 11.50it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 30%|██▉       | 296/1000 [02:51<06:48,  1.72it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 296


 41%|████▏     | 414/1000 [02:10<03:04,  3.18it/s]
  0%|          | 1/1000 [00:00<02:47,  5.98it/s]

Early quitting at epoch: 414


 16%|█▋        | 163/1000 [00:29<02:30,  5.57it/s]
  0%|          | 2/1000 [00:00<01:34, 10.55it/s]

Early quitting at epoch: 163


  1%|          | 12/1000 [00:01<01:46,  9.27it/s]
  0%|          | 2/1000 [00:00<01:02, 15.89it/s]

Early quitting at epoch: 12


  1%|          | 11/1000 [00:00<01:17, 12.82it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 11


  5%|▍         | 47/1000 [00:27<09:08,  1.74it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 47


  7%|▋         | 71/1000 [00:22<04:49,  3.21it/s]
  0%|          | 1/1000 [00:00<02:52,  5.79it/s]

Early quitting at epoch: 71


  4%|▍         | 44/1000 [00:08<02:55,  5.45it/s]
  0%|          | 1/1000 [00:00<02:06,  7.87it/s]

Early quitting at epoch: 44


  5%|▍         | 49/1000 [00:05<01:41,  9.33it/s]
  0%|          | 2/1000 [00:00<01:13, 13.60it/s]

Early quitting at epoch: 49


  4%|▍         | 44/1000 [00:03<01:12, 13.22it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 44


  1%|          | 10/1000 [00:06<09:54,  1.66it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 11/1000 [00:03<05:12,  3.16it/s]
  0%|          | 1/1000 [00:00<02:55,  5.69it/s]

Early quitting at epoch: 11


  1%|▏         | 14/1000 [00:02<03:10,  5.18it/s]
  0%|          | 1/1000 [00:00<01:52,  8.90it/s]

Early quitting at epoch: 14


  2%|▏         | 16/1000 [00:01<01:47,  9.16it/s]
  0%|          | 2/1000 [00:00<01:08, 14.57it/s]

Early quitting at epoch: 16


  2%|▏         | 23/1000 [00:01<01:13, 13.36it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 23


  1%|          | 10/1000 [00:06<10:20,  1.60it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:03<05:24,  3.05it/s]
  0%|          | 1/1000 [00:00<02:53,  5.75it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<03:07,  5.28it/s]
  0%|          | 1/1000 [00:00<02:03,  8.12it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:01,  8.15it/s]
  0%|          | 2/1000 [00:00<01:26, 11.58it/s]

Early quitting at epoch: 10


  1%|          | 11/1000 [00:01<01:35, 10.34it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 11


100%|██████████| 1000/1000 [08:28<00:00,  1.97it/s]
  1%|          | 12/1000 [00:03<05:03,  3.25it/s]
  0%|          | 1/1000 [00:00<02:42,  6.14it/s]

Early quitting at epoch: 12


  1%|          | 10/1000 [00:01<02:50,  5.80it/s]
  0%|          | 1/1000 [00:00<01:46,  9.37it/s]

Early quitting at epoch: 10


  1%|          | 12/1000 [00:01<01:45,  9.36it/s]
  0%|          | 2/1000 [00:00<00:58, 17.03it/s]

Early quitting at epoch: 12


  1%|          | 10/1000 [00:00<01:10, 14.03it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 34%|███▍      | 340/1000 [02:53<05:36,  1.96it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 340


 61%|██████    | 608/1000 [02:46<01:47,  3.65it/s]
  0%|          | 1/1000 [00:00<02:40,  6.22it/s]

Early quitting at epoch: 608


  2%|▏         | 17/1000 [00:02<02:45,  5.94it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 17


  1%|          | 11/1000 [00:01<01:44,  9.43it/s]
  0%|          | 2/1000 [00:00<01:08, 14.67it/s]

Early quitting at epoch: 11


  1%|          | 11/1000 [00:00<01:08, 14.48it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 11


  8%|▊         | 79/1000 [00:41<08:01,  1.91it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 79


  9%|▉         | 92/1000 [00:25<04:06,  3.68it/s]
  0%|          | 1/1000 [00:00<02:37,  6.36it/s]

Early quitting at epoch: 92


  5%|▍         | 49/1000 [00:07<02:28,  6.38it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 49


  6%|▌         | 55/1000 [00:05<01:34,  9.96it/s]
  0%|          | 2/1000 [00:00<01:08, 14.58it/s]

Early quitting at epoch: 55


  1%|          | 10/1000 [00:00<01:14, 13.35it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 11/1000 [00:05<08:41,  1.90it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 11


  1%|          | 12/1000 [00:03<04:45,  3.46it/s]
  0%|          | 1/1000 [00:00<02:55,  5.71it/s]

Early quitting at epoch: 12


  2%|▏         | 18/1000 [00:02<02:41,  6.07it/s]
  0%|          | 2/1000 [00:00<01:29, 11.16it/s]

Early quitting at epoch: 18


  3%|▎         | 26/1000 [00:02<01:31, 10.62it/s]
  0%|          | 2/1000 [00:00<01:01, 16.17it/s]

Early quitting at epoch: 26


  2%|▏         | 24/1000 [00:01<01:05, 14.90it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 24


  1%|          | 10/1000 [00:05<09:28,  1.74it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:02<04:34,  3.61it/s]
  0%|          | 1/1000 [00:00<02:40,  6.21it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:45,  5.98it/s]
  0%|          | 2/1000 [00:00<01:25, 11.72it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:00<01:38, 10.03it/s]
  0%|          | 2/1000 [00:00<01:14, 13.34it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:00<01:22, 12.07it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 72%|███████▏  | 724/1000 [05:29<02:05,  2.20it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 724


 93%|█████████▎| 934/1000 [03:55<00:16,  3.96it/s]
  0%|          | 1/1000 [00:00<02:13,  7.46it/s]

Early quitting at epoch: 934


  2%|▏         | 20/1000 [00:03<02:38,  6.20it/s]
  0%|          | 2/1000 [00:00<01:31, 10.86it/s]

Early quitting at epoch: 20


  2%|▏         | 17/1000 [00:01<01:40,  9.77it/s]
  0%|          | 2/1000 [00:00<01:00, 16.50it/s]

Early quitting at epoch: 17


  1%|          | 10/1000 [00:00<01:08, 14.42it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 35%|███▍      | 348/1000 [02:40<05:01,  2.17it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 348


 38%|███▊      | 379/1000 [01:35<02:36,  3.96it/s]
  0%|          | 1/1000 [00:00<02:31,  6.58it/s]

Early quitting at epoch: 379


  8%|▊         | 76/1000 [00:11<02:20,  6.56it/s]
  0%|          | 2/1000 [00:00<01:31, 10.89it/s]

Early quitting at epoch: 76


  2%|▏         | 19/1000 [00:02<01:43,  9.46it/s]
  0%|          | 2/1000 [00:00<01:04, 15.59it/s]

Early quitting at epoch: 19


  2%|▏         | 16/1000 [00:01<01:08, 14.40it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 16


  6%|▌         | 61/1000 [00:28<07:12,  2.17it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 61


  8%|▊         | 79/1000 [00:20<03:56,  3.89it/s]
  0%|          | 1/1000 [00:00<02:31,  6.61it/s]

Early quitting at epoch: 79


  4%|▍         | 38/1000 [00:05<02:25,  6.63it/s]
  0%|          | 1/1000 [00:00<01:43,  9.69it/s]

Early quitting at epoch: 38


  3%|▎         | 31/1000 [00:02<01:32, 10.47it/s]
  0%|          | 2/1000 [00:00<01:04, 15.56it/s]

Early quitting at epoch: 31


  1%|          | 12/1000 [00:00<01:13, 13.50it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 12


  1%|          | 11/1000 [00:05<07:48,  2.11it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 11


  1%|          | 12/1000 [00:03<04:23,  3.76it/s]
  0%|          | 1/1000 [00:00<02:13,  7.47it/s]

Early quitting at epoch: 12


  1%|▏         | 14/1000 [00:02<02:38,  6.22it/s]
  0%|          | 2/1000 [00:00<01:28, 11.23it/s]

Early quitting at epoch: 14


  2%|▏         | 17/1000 [00:01<01:44,  9.42it/s]
  0%|          | 2/1000 [00:00<01:07, 14.75it/s]

Early quitting at epoch: 17


  2%|▏         | 17/1000 [00:01<01:06, 14.69it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 17


  1%|          | 10/1000 [00:05<08:31,  1.94it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:02<04:47,  3.44it/s]
  0%|          | 1/1000 [00:00<02:31,  6.59it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:47,  5.91it/s]
  0%|          | 1/1000 [00:00<01:43,  9.70it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:00<01:37, 10.13it/s]
  0%|          | 2/1000 [00:00<00:57, 17.23it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:00<01:05, 15.18it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


 83%|████████▎ | 834/1000 [05:43<01:08,  2.43it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 834


 80%|███████▉  | 799/1000 [03:00<00:45,  4.42it/s]
  0%|          | 1/1000 [00:00<02:02,  8.18it/s]

Early quitting at epoch: 799


  2%|▏         | 17/1000 [00:02<02:15,  7.27it/s]
  0%|          | 2/1000 [00:00<01:23, 11.97it/s]

Early quitting at epoch: 17


  1%|▏         | 14/1000 [00:01<01:26, 11.44it/s]
  0%|          | 2/1000 [00:00<00:57, 17.30it/s]

Early quitting at epoch: 14


  1%|          | 12/1000 [00:00<01:01, 16.02it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 12


 27%|██▋       | 270/1000 [01:52<05:05,  2.39it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 270


 47%|████▋     | 474/1000 [01:47<01:59,  4.40it/s]
  0%|          | 1/1000 [00:00<02:08,  7.77it/s]

Early quitting at epoch: 474


  6%|▌         | 58/1000 [00:07<02:06,  7.43it/s]
  0%|          | 2/1000 [00:00<01:13, 13.50it/s]

Early quitting at epoch: 58


  2%|▏         | 15/1000 [00:01<01:22, 11.94it/s]
  0%|          | 2/1000 [00:00<00:58, 17.18it/s]

Early quitting at epoch: 15


  1%|▏         | 13/1000 [00:00<01:05, 15.16it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 13


  7%|▋         | 73/1000 [00:31<06:34,  2.35it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 73


 10%|▉         | 96/1000 [00:22<03:28,  4.34it/s]
  0%|          | 1/1000 [00:00<01:56,  8.55it/s]

Early quitting at epoch: 96


  6%|▌         | 57/1000 [00:07<02:07,  7.38it/s]
  0%|          | 2/1000 [00:00<01:16, 13.01it/s]

Early quitting at epoch: 57


  5%|▌         | 53/1000 [00:04<01:20, 11.81it/s]
  0%|          | 2/1000 [00:00<01:01, 16.23it/s]

Early quitting at epoch: 53


  2%|▏         | 24/1000 [00:01<00:57, 16.86it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 24


  1%|▏         | 14/1000 [00:06<07:03,  2.33it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 14


  2%|▏         | 15/1000 [00:03<03:59,  4.12it/s]
  0%|          | 1/1000 [00:00<02:19,  7.18it/s]

Early quitting at epoch: 15


  2%|▏         | 20/1000 [00:02<02:17,  7.10it/s]
  0%|          | 2/1000 [00:00<01:17, 12.95it/s]

Early quitting at epoch: 20


  2%|▏         | 20/1000 [00:01<01:26, 11.33it/s]
  0%|          | 2/1000 [00:00<00:59, 16.84it/s]

Early quitting at epoch: 20


  2%|▏         | 22/1000 [00:01<01:01, 16.01it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 22


  1%|          | 10/1000 [00:04<07:53,  2.09it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:02<04:04,  4.06it/s]
  0%|          | 1/1000 [00:00<02:14,  7.40it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:29,  6.61it/s]
  0%|          | 2/1000 [00:00<01:24, 11.83it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:00<01:28, 11.18it/s]
  0%|          | 2/1000 [00:00<00:52, 18.90it/s]

Early quitting at epoch: 10


  1%|          | 12/1000 [00:00<01:03, 15.67it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 12


 81%|████████  | 806/1000 [05:15<01:15,  2.56it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 806


100%|██████████| 1000/1000 [03:35<00:00,  4.65it/s]
  1%|▏         | 13/1000 [00:01<02:11,  7.51it/s]
  0%|          | 2/1000 [00:00<01:10, 14.08it/s]

Early quitting at epoch: 13


  1%|          | 10/1000 [00:00<01:19, 12.53it/s]
  0%|          | 2/1000 [00:00<00:59, 16.87it/s]

Early quitting at epoch: 10


  1%|          | 11/1000 [00:00<00:58, 16.97it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 11


 37%|███▋      | 374/1000 [02:27<04:06,  2.54it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 374


 45%|████▌     | 454/1000 [01:37<01:56,  4.68it/s]
  0%|          | 1/1000 [00:00<01:57,  8.49it/s]

Early quitting at epoch: 454


  2%|▏         | 18/1000 [00:02<02:12,  7.41it/s]
  0%|          | 2/1000 [00:00<01:19, 12.52it/s]

Early quitting at epoch: 18


  2%|▎         | 25/1000 [00:02<01:19, 12.25it/s]
  0%|          | 2/1000 [00:00<00:56, 17.58it/s]

Early quitting at epoch: 25


  1%|          | 10/1000 [00:00<00:59, 16.69it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  9%|▉         | 93/1000 [00:36<05:57,  2.53it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 93


 14%|█▍        | 141/1000 [00:30<03:05,  4.62it/s]
  0%|          | 1/1000 [00:00<01:54,  8.70it/s]

Early quitting at epoch: 141


  7%|▋         | 66/1000 [00:08<02:00,  7.75it/s]
  0%|          | 2/1000 [00:00<01:21, 12.24it/s]

Early quitting at epoch: 66


  3%|▎         | 30/1000 [00:02<01:19, 12.26it/s]
  0%|          | 2/1000 [00:00<00:54, 18.45it/s]

Early quitting at epoch: 30


  4%|▍         | 41/1000 [00:02<00:55, 17.43it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 41


  1%|▏         | 14/1000 [00:05<06:57,  2.36it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 14


  2%|▏         | 17/1000 [00:03<03:44,  4.38it/s]
  0%|          | 1/1000 [00:00<02:15,  7.35it/s]

Early quitting at epoch: 17


  2%|▎         | 25/1000 [00:03<02:05,  7.78it/s]
  0%|          | 1/1000 [00:00<02:44,  6.07it/s]

Early quitting at epoch: 25


  2%|▏         | 19/1000 [00:01<01:24, 11.63it/s]
  0%|          | 3/1000 [00:00<00:44, 22.18it/s]

Early quitting at epoch: 19


  1%|          | 11/1000 [00:00<00:53, 18.42it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 11


  1%|          | 10/1000 [00:04<07:32,  2.19it/s]
  0%|          | 0/1000 [00:00<?, ?it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:02<03:34,  4.62it/s]
  0%|          | 1/1000 [00:00<02:00,  8.26it/s]

Early quitting at epoch: 10


  1%|          | 10/1000 [00:01<02:19,  7.09it/s]
  0%|          | 2/1000 [00:00<01:27, 11.37it/s]

Early quitting at epoch: 10


  1%|          | 11/1000 [00:00<01:28, 11.21it/s]
  0%|          | 2/1000 [00:00<00:53, 18.79it/s]

Early quitting at epoch: 11


  1%|          | 11/1000 [00:00<01:02, 15.87it/s]

Early quitting at epoch: 11





In [86]:
# Save all trained models
# The destination is "<models_dir>/<dataset_method>"; both names come from outside this cell.
# NOTE(review): `dir` shadows Python's builtin dir() for the rest of the kernel
# session. It is left as-is here because other cells may read this global —
# consider renaming it (e.g. to `save_dir`) consistently across the notebook.
dir = f"{models_dir}/{dataset_method}"
# to_be_saved_models=None presumably means "save every trained model" (per the
# cell title) — TODO confirm against Trainer.save_trained_models.
trainer_mean.save_trained_models(dir=dir, to_be_saved_models=None)