In [1]:
%load_ext autoreload
%autoreload 2

import torch
import torchvision
import torch.nn.functional as F
from torch import nn
from sklearn.metrics import precision_recall_fscore_support
import numpy as np

# manage ray's relative imports

import ray
# Ship the parent directory to the Ray workers as their working directory so that
# project-relative imports resolve on the worker side as well.
runtime_env = {"working_dir": ".."}

# NOTE(review): dashboard_host="0.0.0.0" binds the dashboard to every network
# interface; keep it only on a trusted network.
# ignore_reinit_error=True makes this cell safe to re-run in a live kernel:
# without it a second ray.init() call raises because Ray is already initialised.
ray.init(
    runtime_env=runtime_env,
    dashboard_port=13065,
    include_dashboard=True,
    dashboard_host="0.0.0.0",
    ignore_reinit_error=True,
)
from ray import tune
from ray.tune.suggest.optuna import OptunaSearch
from ray.tune import JupyterNotebookReporter

# manage beams's relative imports
import sys

# Make the parent directory importable so that `src.beam` resolves from this notebook.
# Guarded so that re-running the cell does not keep appending duplicate entries.
if '..' not in sys.path:
    sys.path.append('..')

from src.beam import beam_arguments, Experiment, Study
from src.beam import UniversalDataset, UniversalBatchSampler
from src.beam import Algorithm
from src.beam import LinearNet
from torchvision import transforms
import matplotlib.pyplot as plt

from src.beam import DataTensor
from src.beam.utils import is_notebook
from cifar10_example import Cifar10Network, CIFAR10Algorithm, CIFAR10Dataset

from ray.tune.suggest.hebo import HEBOSearch

2022-07-06 20:35:57,004	INFO services.py:1456 -- View the Ray dashboard at [1m[32mhttp://172.17.0.2:13065[39m[22m
2022-07-06 20:35:58,022	INFO packaging.py:388 -- Creating a file package for local directory '..'.
2022-07-06 20:35:58,279	INFO packaging.py:241 -- Pushing file package 'gcs://_ray_pkg_c2239984b08464ed.zip' (1.24MiB) to Ray cluster...
2022-07-06 20:35:58,307	INFO packaging.py:243 -- Successfully pushed file package 'gcs://_ray_pkg_c2239984b08464ed.zip'.


In [2]:
import os

# Dataset location and experiment output root.
# The defaults are the original machine-specific paths; set CIFAR10_DATA_PATH and/or
# CIFAR10_ROOT_DIR in the environment to run elsewhere without editing the notebook,
# e.g. for the shared-storage layout:
#   CIFAR10_DATA_PATH=/home/shared/data/dataset/cifar10
#   CIFAR10_ROOT_DIR=/home/shared/data/results/cifar10
path_to_data = os.environ.get('CIFAR10_DATA_PATH', '/localdata/elads/data/datasets/cifar10')
root_dir = os.environ.get('CIFAR10_ROOT_DIR', '/localdata/elads/data/cifar10')

## Training with a single worker

In [12]:
# One-time setup that runs before any worker is initialised:
# assemble the run arguments and build the experiment object from them.

# Command-line style flags, passed to beam_arguments as separate positional strings.
cli_flags = (
    f"--project-name=cifar10 --root-dir={root_dir} --algorithm=CIFAR10Algorithm --device=0 --amp --lr-d=1e-2 --batch-size=512",
    "--n-epochs=40 --clip-gradient=1000 --parallel=0 --accumulate=1 --no-deterministic",
    "--weight-decay=3e-5 --beta1=0.9",
)

# Extra settings forwarded to beam_arguments as keyword arguments.
hparam_overrides = dict(
    path_to_data=path_to_data,
    dropout=.0,
    activation='relu',
    channels=1024,
    label_smoothing=.2,
    padding=6,
    gain=.2,
    turn_point=512,
    final_point=4096,
    minimal_gain=.05,
    temperature=0.05,
)

args = beam_arguments(*cli_flags, **hparam_overrides)

experiment = Experiment(args)

[32m2022-07-06 20:43:29[0m | [1mINFO    [0m | [1mCreating new experiment[0m
[32m2022-07-06 20:43:29[0m | [1mINFO    [0m | [1mExperiment directory is: /localdata/elads/data/cifar10/cifar10/CIFAR10Algorithm/debug/0159_20220706_204329[0m
[32m2022-07-06 20:43:30[0m | [1mINFO    [0m | [1mbeam project: cifar10[0m
[32m2022-07-06 20:43:30[0m | [1mINFO    [0m | [1mExperiment Hyperparameters[0m
[32m2022-07-06 20:43:30[0m | [1mINFO    [0m | [1mproject_name: cifar10[0m
[32m2022-07-06 20:43:30[0m | [1mINFO    [0m | [1malgorithm: CIFAR10Algorithm[0m
[32m2022-07-06 20:43:30[0m | [1mINFO    [0m | [1midentifier: debug[0m
[32m2022-07-06 20:43:30[0m | [1mINFO    [0m | [1mmp_port: random[0m
[32m2022-07-06 20:43:30[0m | [1mINFO    [0m | [1mroot_dir: /localdata/elads/data/cifar10[0m
[32m2022-07-06 20:43:30[0m | [1mINFO    [0m | [1mreload: False[0m
[32m2022-07-06 20:43:30[0m | [1mINFO    [0m | [1mresume: -1[0m
[32m2022-07-06 20:43:30[0m | [

In [16]:
# Rebind `experiment` to the run stored in this experiment directory.
experiment_dir = '/localdata/elads/data/cifar10/cifar10/CIFAR10Algorithm/debug/0159_20220706_204329'
experiment = Experiment.reload_from_path(experiment_dir)

[32m2022-07-06 20:48:44[0m | [1mINFO    [0m | [1mReload experiment from path: /localdata/elads/data/cifar10/cifar10/CIFAR10Algorithm/debug/0159_20220706_204329[0m
[32m2022-07-06 20:48:44[0m | [1mINFO    [0m | [1mResuming existing experiment[0m
[32m2022-07-06 20:48:44[0m | [1mINFO    [0m | [1mbeam project: cifar10[0m
[32m2022-07-06 20:48:44[0m | [1mINFO    [0m | [1mExperiment Hyperparameters[0m
[32m2022-07-06 20:48:44[0m | [1mINFO    [0m | [1mproject_name: cifar10[0m
[32m2022-07-06 20:48:44[0m | [1mINFO    [0m | [1malgorithm: CIFAR10Algorithm[0m
[32m2022-07-06 20:48:44[0m | [1mINFO    [0m | [1midentifier: debug[0m
[32m2022-07-06 20:48:44[0m | [1mINFO    [0m | [1mmp_port: random[0m
[32m2022-07-06 20:48:44[0m | [1mINFO    [0m | [1mroot_dir: /localdata/elads/data/cifar10[0m
[32m2022-07-06 20:48:44[0m | [1mINFO    [0m | [1mreload: True[0m
[32m2022-07-06 20:48:44[0m | [1mINFO    [0m | [1mresume: 0159_20220706_204329[0m
[32m20

In [None]:
# Train CIFAR10Algorithm on CIFAR10Dataset through the experiment.
# The nested dict is handed to `fit` as its TensorBoard options; presumably it marks
# the logged image samples as NCHW-formatted -- TODO confirm against the beam API.
tensorboard_arguments = {'images': {'sample': {'dataformats': 'NCHW'}}}
alg = experiment.fit(
    CIFAR10Algorithm,
    CIFAR10Dataset,
    tensorboard_arguments=tensorboard_arguments,
)

[32m2022-07-06 20:48:50[0m | [1mINFO    [0m | [1mSingle worker mode[0m
[32m2022-07-06 20:48:50[0m | [1mINFO    [0m | [1mWorker: 1/1 is running...[0m
[32m2022-07-06 20:48:50[0m | [1mINFO    [0m | [1mReload experiment from checkpoint: /localdata/elads/data/cifar10/cifar10/CIFAR10Algorithm/debug/0159_20220706_204329/checkpoints/checkpoint_000015[0m


train:   0%|          | 0/73 [00:00<?, ?it/s]

validation:   0%|          | 0/22 [00:00<?, ?it/s]

[32m2022-07-06 20:49:02[0m | [1mINFO    [0m | [1m[0m
[32m2022-07-06 20:49:02[0m | [1mINFO    [0m | [1mFinished epoch 1/40:[0m
[32m2022-07-06 20:49:02[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 20:49:02[0m | [1mINFO    [0m | [1mloss:           | avg: 613.4     | std: 16.78     | min: 577.2     | 25%: 601.5     | 50%: 614.0     | 75%: 621.9     | max: 667.8     [0m
[32m2022-07-06 20:49:02[0m | [1mINFO    [0m | [1macc:            | avg: 0.8465    | std: 0.02106   | min: 0.7812    | 25%: 0.834     | 50%: 0.8496    | 75%: 0.8613    | max: 0.8926    [0m
[32m2022-07-06 20:49:02[0m | [1mINFO    [0m | [1mlr:             | avg: 0.0005    | std: nan       | min: 0.0005    | 25%: 0.0005    | 50%: 0.0005    | 75%: 0.0005    | max: 0.0005    [0m
[32m2022-07-06 20:49:02[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 20:49:02[0m | [1mINFO    [0m | [1mloss:           | avg: 611.1     | std: 9.262     | min: 597.8     | 25%: 603.9     | 50%: 

train:   0%|          | 0/73 [00:00<?, ?it/s]

validation:   0%|          | 0/22 [00:00<?, ?it/s]

[32m2022-07-06 20:49:21[0m | [1mINFO    [0m | [1m[0m
[32m2022-07-06 20:49:21[0m | [1mINFO    [0m | [1mFinished epoch 2/40:[0m
[32m2022-07-06 20:49:21[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 20:49:21[0m | [1mINFO    [0m | [1mloss:           | avg: 590.8     | std: 12.92     | min: 561.9     | 25%: 581.7     | 50%: 589.4     | 75%: 600.8     | max: 624.2     [0m
[32m2022-07-06 20:49:21[0m | [1mINFO    [0m | [1macc:            | avg: 0.8701    | std: 0.01719   | min: 0.8281    | 25%: 0.8574    | 50%: 0.8711    | 75%: 0.8828    | max: 0.9121    [0m
[32m2022-07-06 20:49:21[0m | [1mINFO    [0m | [1mlr:             | avg: 0.0005703 | std: nan       | min: 0.0005703 | 25%: 0.0005703 | 50%: 0.0005703 | 75%: 0.0005703 | max: 0.0005703 [0m
[32m2022-07-06 20:49:21[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 20:49:21[0m | [1mINFO    [0m | [1mloss:           | avg: 612.5     | std: 10.3      | min: 596.8     | 25%: 604.4     | 50%: 

train:   0%|          | 0/73 [00:00<?, ?it/s]

## Training with 4 workers

In [6]:
# One-time setup that runs before the workers are initialised:
# assemble the run arguments (note --parallel=4) and build the experiment from them.

# Command-line style flags, passed to beam_arguments as separate positional strings.
cli_flags = (
    f"--project-name=cifar10 --root-dir={root_dir} --algorithm=CIFAR10Algorithm --device=0 --half --lr-d=1e-3 --batch-size=512",
    "--n-epochs=40 --clip-gradient=1000 --parallel=4 --accumulate=1 --no-deterministic",
    "--weight-decay=1e-5 --beta1=0.9 --beta2=0.9",
)

# Extra settings forwarded to beam_arguments as keyword arguments.
hparam_overrides = dict(
    path_to_data=path_to_data,
    dropout=.0,
    activation='relu',
    channels=512,
    label_smoothing=.2,
    padding=6,
    gain=.2,
    turn_point=1024,
    final_point=3000,
    minimal_gain=.05,
    temperature=1,
)

args = beam_arguments(*cli_flags, **hparam_overrides)

experiment = Experiment(args)

[32m2022-07-06 12:28:01[0m | [1mINFO    [0m | [1mCreating new experiment[0m
[32m2022-07-06 12:28:01[0m | [1mINFO    [0m | [1mExperiment directory is: /localdata/elads/data/cifar10/cifar10/CIFAR10Algorithm/debug/0147_20220706_122801[0m
[32m2022-07-06 12:28:02[0m | [1mINFO    [0m | [1mbeam project: cifar10[0m
[32m2022-07-06 12:28:02[0m | [1mINFO    [0m | [1mExperiment Hyperparameters[0m
[32m2022-07-06 12:28:02[0m | [1mINFO    [0m | [1mproject_name: cifar10[0m
[32m2022-07-06 12:28:02[0m | [1mINFO    [0m | [1malgorithm: CIFAR10Algorithm[0m
[32m2022-07-06 12:28:02[0m | [1mINFO    [0m | [1midentifier: debug[0m
[32m2022-07-06 12:28:02[0m | [1mINFO    [0m | [1mmp_port: random[0m
[32m2022-07-06 12:28:02[0m | [1mINFO    [0m | [1mroot_dir: /localdata/elads/data/cifar10[0m
[32m2022-07-06 12:28:02[0m | [1mINFO    [0m | [1mreload: False[0m
[32m2022-07-06 12:28:02[0m | [1mINFO    [0m | [1mresume: -1[0m
[32m2022-07-06 12:28:02[0m | [

In [7]:
# Launch training of CIFAR10Algorithm on CIFAR10Dataset with the experiment configured above.
# The nested dict is handed to `fit` as its TensorBoard options; presumably it marks
# the logged image samples as NCHW-formatted -- TODO confirm against the beam API.
tensorboard_arguments = {'images': {'sample': {'dataformats': 'NCHW'}}}
alg = experiment.fit(
    CIFAR10Algorithm,
    CIFAR10Dataset,
    tensorboard_arguments=tensorboard_arguments,
)

[32m2022-07-06 12:28:07[0m | [1mINFO    [0m | [1mInitializing 4 parallel workers[0m
[32m2022-07-06 12:28:07[0m | [1mINFO    [0m | [1mMultiprocessing port is: 45081[0m
[32m2022-07-06 12:28:10[0m | [1mINFO    [0m | [1mWorker: 3/4 is running...[0m
[32m2022-07-06 12:28:10[0m | [1mINFO    [0m | [1mWorker: 4/4 is running...[0m
[32m2022-07-06 12:28:10[0m | [1mINFO    [0m | [1mWorker: 1/4 is running...[0m
[32m2022-07-06 12:28:10[0m | [1mINFO    [0m | [1mWorker: 2/4 is running...[0m


[W socket.cpp:558] [c10d] The client socket has failed to connect to [localhost]:45081 (errno: 101 - Network is unreachable).
[W socket.cpp:558] [c10d] The client socket has failed to connect to [localhost]:45081 (errno: 101 - Network is unreachable).
train: 100%|██████████| 73/73 [00:15<00:00,  4.79it/s]
validation:   0%|          | 0/22 [00:00<?, ?it/s]
train: 100%|██████████| 73/73 [00:16<00:00,  4.39it/s]
validation:   0%|          | 0/22 [00:00<?, ?it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 36.45it/s]


[32m2022-07-06 12:28:32[0m | [1mINFO    [0m | [1mFinished epoch 1/40:[0m
[32m2022-07-06 12:28:32[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:28:32[0m | [1mINFO    [0m | [1mloss:	| avg: inf      	|  std: nan      	|  min: 993.0    	|  25%: 1.099e+03	|  50%: 1.308e+03	|  75%: 1.602e+03	|  max: inf      [0m
[32m2022-07-06 12:28:32[0m | [1mINFO    [0m | [1macc:	| avg: 0.2357   	|  std: 0.08556  	|  min: 0.08398  	|  25%: 0.1621   	|  50%: 0.2227   	|  75%: 0.3125   	|  max: 0.4141   [0m
[32m2022-07-06 12:28:32[0m | [1mINFO    [0m | [1mlr:	| avg: 5e-05    	|  std: nan      	|  min: 5e-05    	|  25%: 5e-05    	|  50%: 5e-05    	|  75%: 5e-05    	|  max: 5e-05    [0m
[32m2022-07-06 12:28:32[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:28:32[0m | [1mINFO    [0m | [1mloss:	| avg: 1.029e+03	|  std: 24.41    	|  min: 991.0    	|  25%: 1.013e+03	|  50%: 1.026e+03	|  75%: 1.042e+03	|  max: 1.078e+03[0m
[32m2022-07-06 12:28:32[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]

train:   0%|          | 0/73 [00:00<?, ?it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  4.99it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  4.99it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  4.99it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  4.99it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 37.24it/s]


[32m2022-07-06 12:28:48[0m | [1mINFO    [0m | [1mFinished epoch 2/40:[0m
[32m2022-07-06 12:28:48[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:28:48[0m | [1mINFO    [0m | [1mloss:	| avg: 924.1    	|  std: 61.74    	|  min: 812.5    	|  25%: 880.0    	|  50%: 919.5    	|  75%: 965.5    	|  max: 1.06e+03 [0m
[32m2022-07-06 12:28:48[0m | [1mINFO    [0m | [1macc:	| avg: 0.4973   	|  std: 0.06777  	|  min: 0.3652   	|  25%: 0.4473   	|  50%: 0.5059   	|  75%: 0.5488   	|  max: 0.6426   [0m
[32m2022-07-06 12:28:48[0m | [1mINFO    [0m | [1mlr:	| avg: 5e-05    	|  std: nan      	|  min: 5e-05    	|  25%: 5e-05    	|  50%: 5e-05    	|  75%: 5e-05    	|  max: 5e-05    [0m
[32m2022-07-06 12:28:48[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:28:48[0m | [1mINFO    [0m | [1mloss:	| avg: 863.6    	|  std: 20.77    	|  min: 838.0    	|  25%: 848.2    	|  50%: 857.2    	|  75%: 874.5    	|  max: 908.0    [0m
[32m2022-07-06 12:28:48[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]


train: 100%|██████████| 73/73 [00:14<00:00,  5.01it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.01it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.01it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.01it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 37.63it/s]


[32m2022-07-06 12:29:04[0m | [1mINFO    [0m | [1mFinished epoch 3/40:[0m
[32m2022-07-06 12:29:04[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:29:04[0m | [1mINFO    [0m | [1mloss:	| avg: 808.7    	|  std: 26.52    	|  min: 745.5    	|  25%: 793.5    	|  50%: 807.0    	|  75%: 824.5    	|  max: 889.0    [0m
[32m2022-07-06 12:29:04[0m | [1mINFO    [0m | [1macc:	| avg: 0.626    	|  std: 0.03987  	|  min: 0.5293   	|  25%: 0.6035   	|  50%: 0.623    	|  75%: 0.6504   	|  max: 0.7383   [0m
[32m2022-07-06 12:29:04[0m | [1mINFO    [0m | [1mlr:	| avg: 5e-05    	|  std: nan      	|  min: 5e-05    	|  25%: 5e-05    	|  50%: 5e-05    	|  75%: 5e-05    	|  max: 5e-05    [0m
[32m2022-07-06 12:29:04[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:29:04[0m | [1mINFO    [0m | [1mloss:	| avg: 778.9    	|  std: 15.98    	|  min: 756.0    	|  25%: 767.2    	|  50%: 777.0    	|  75%: 789.5    	|  max: 815.0    [0m
[32m2022-07-06 12:29:04[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]
train:   0%|          | 0/73 [00:00<?, ?it/s]

train: 100%|██████████| 73/73 [00:14<00:00,  5.00it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.00it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.00it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.00it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 37.13it/s]


[32m2022-07-06 12:29:20[0m | [1mINFO    [0m | [1mFinished epoch 4/40:[0m
[32m2022-07-06 12:29:20[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:29:20[0m | [1mINFO    [0m | [1mloss:	| avg: 755.4    	|  std: 24.95    	|  min: 702.5    	|  25%: 735.0    	|  50%: 754.0    	|  75%: 772.0    	|  max: 809.0    [0m
[32m2022-07-06 12:29:20[0m | [1mINFO    [0m | [1macc:	| avg: 0.6929   	|  std: 0.03324  	|  min: 0.6035   	|  25%: 0.6719   	|  50%: 0.6973   	|  75%: 0.7188   	|  max: 0.752    [0m
[32m2022-07-06 12:29:20[0m | [1mINFO    [0m | [1mlr:	| avg: 5.703e-05	|  std: nan      	|  min: 5.703e-05	|  25%: 5.703e-05	|  50%: 5.703e-05	|  75%: 5.703e-05	|  max: 5.703e-05[0m
[32m2022-07-06 12:29:20[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:29:20[0m | [1mINFO    [0m | [1mloss:	| avg: 786.5    	|  std: 17.26    	|  min: 744.5    	|  25%: 780.8    	|  50%: 787.2    	|  75%: 792.8    	|  max: 821.0    [0m
[32m2022-07-06 12:29:20[0m | 



train:   0%|          | 0/73 [00:00<?, ?it/s]

train: 100%|██████████| 73/73 [00:14<00:00,  5.00it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.00it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  4.99it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  4.99it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 37.28it/s]


[32m2022-07-06 12:29:36[0m | [1mINFO    [0m | [1mFinished epoch 5/40:[0m
[32m2022-07-06 12:29:36[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:29:36[0m | [1mINFO    [0m | [1mloss:	| avg: 731.3    	|  std: 25.39    	|  min: 690.5    	|  25%: 716.0    	|  50%: 728.0    	|  75%: 746.5    	|  max: 815.5    [0m
[32m2022-07-06 12:29:36[0m | [1mINFO    [0m | [1macc:	| avg: 0.7293   	|  std: 0.02984  	|  min: 0.6445   	|  25%: 0.7129   	|  50%: 0.7324   	|  75%: 0.75     	|  max: 0.7793   [0m
[32m2022-07-06 12:29:36[0m | [1mINFO    [0m | [1mlr:	| avg: 7.129e-05	|  std: nan      	|  min: 7.129e-05	|  25%: 7.129e-05	|  50%: 7.129e-05	|  75%: 7.129e-05	|  max: 7.129e-05[0m
[32m2022-07-06 12:29:36[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:29:36[0m | [1mINFO    [0m | [1mloss:	| avg: 732.4    	|  std: 14.61    	|  min: 709.0    	|  25%: 720.6    	|  50%: 732.2    	|  75%: 742.6    	|  max: 766.0    [0m
[32m2022-07-06 12:29:36[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]

train:   0%|          | 0/73 [00:00<?, ?it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.00it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.00it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.00it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.00it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 35.21it/s]


[32m2022-07-06 12:29:52[0m | [1mINFO    [0m | [1mFinished epoch 6/40:[0m
[32m2022-07-06 12:29:52[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:29:52[0m | [1mINFO    [0m | [1mloss:	| avg: 721.0    	|  std: 19.66    	|  min: 675.0    	|  25%: 707.5    	|  50%: 722.0    	|  75%: 732.0    	|  max: 790.0    [0m
[32m2022-07-06 12:29:52[0m | [1mINFO    [0m | [1macc:	| avg: 0.7541   	|  std: 0.02168  	|  min: 0.6914   	|  25%: 0.7422   	|  50%: 0.7559   	|  75%: 0.7695   	|  max: 0.8125   [0m
[32m2022-07-06 12:29:52[0m | [1mINFO    [0m | [1mlr:	| avg: 8.555e-05	|  std: nan      	|  min: 8.555e-05	|  25%: 8.555e-05	|  50%: 8.555e-05	|  75%: 8.555e-05	|  max: 8.555e-05[0m
[32m2022-07-06 12:29:52[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:29:52[0m | [1mINFO    [0m | [1mloss:	| avg: 773.8    	|  std: 28.19    	|  min: 723.0    	|  25%: 752.2    	|  50%: 768.2    	|  75%: 780.9    	|  max: 829.0    [0m
[32m2022-07-06 12:29:52[0m | 





train: 100%|██████████| 73/73 [00:14<00:00,  5.01it/s]
validation:   0%|          | 0/22 [00:00<?, ?it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.01it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.01it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 35.70it/s]


[32m2022-07-06 12:30:08[0m | [1mINFO    [0m | [1mFinished epoch 7/40:[0m
[32m2022-07-06 12:30:08[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:30:08[0m | [1mINFO    [0m | [1mloss:	| avg: 721.2    	|  std: 28.79    	|  min: 666.0    	|  25%: 699.5    	|  50%: 718.0    	|  75%: 741.0    	|  max: 800.0    [0m
[32m2022-07-06 12:30:08[0m | [1mINFO    [0m | [1macc:	| avg: 0.7643   	|  std: 0.03148  	|  min: 0.6699   	|  25%: 0.75     	|  50%: 0.7676   	|  75%: 0.7852   	|  max: 0.8184   [0m
[32m2022-07-06 12:30:08[0m | [1mINFO    [0m | [1mlr:	| avg: 9.98e-05 	|  std: nan      	|  min: 9.98e-05 	|  25%: 9.98e-05 	|  50%: 9.98e-05 	|  75%: 9.98e-05 	|  max: 9.98e-05 [0m
[32m2022-07-06 12:30:08[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:30:08[0m | [1mINFO    [0m | [1mloss:	| avg: 797.3    	|  std: 55.22    	|  min: 740.5    	|  25%: 771.2    	|  50%: 781.5    	|  75%: 812.5    	|  max: 1.006e+03[0m
[32m2022-07-06 12:30:08[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]


train: 100%|██████████| 73/73 [00:14<00:00,  5.00it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.00it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.00it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.00it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 37.11it/s]


[32m2022-07-06 12:30:24[0m | [1mINFO    [0m | [1mFinished epoch 8/40:[0m
[32m2022-07-06 12:30:24[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:30:24[0m | [1mINFO    [0m | [1mloss:	| avg: 719.3    	|  std: 29.96    	|  min: 656.0    	|  25%: 698.0    	|  50%: 716.5    	|  75%: 732.0    	|  max: 804.0    [0m
[32m2022-07-06 12:30:24[0m | [1mINFO    [0m | [1macc:	| avg: 0.7814   	|  std: 0.02569  	|  min: 0.7344   	|  25%: 0.7598   	|  50%: 0.7793   	|  75%: 0.8008   	|  max: 0.8359   [0m
[32m2022-07-06 12:30:24[0m | [1mINFO    [0m | [1mlr:	| avg: 0.0001141	|  std: nan      	|  min: 0.0001141	|  25%: 0.0001141	|  50%: 0.0001141	|  75%: 0.0001141	|  max: 0.0001141[0m
[32m2022-07-06 12:30:24[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:30:24[0m | [1mINFO    [0m | [1mloss:	| avg: 778.5    	|  std: 55.88    	|  min: 716.0    	|  25%: 740.0    	|  50%: 757.0    	|  75%: 797.2    	|  max: 947.5    [0m
[32m2022-07-06 12:30:24[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]
train:   0%|          | 0/73 [00:00<?, ?it/s]

train: 100%|██████████| 73/73 [00:14<00:00,  4.98it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  4.98it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  4.97it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  4.97it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 37.38it/s]


[32m2022-07-06 12:30:40[0m | [1mINFO    [0m | [1mFinished epoch 9/40:[0m
[32m2022-07-06 12:30:40[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:30:40[0m | [1mINFO    [0m | [1mloss:	| avg: 717.5    	|  std: 35.93    	|  min: 652.0    	|  25%: 689.0    	|  50%: 719.0    	|  75%: 743.5    	|  max: 827.0    [0m
[32m2022-07-06 12:30:40[0m | [1mINFO    [0m | [1macc:	| avg: 0.7911   	|  std: 0.02992  	|  min: 0.6914   	|  25%: 0.7812   	|  50%: 0.791    	|  75%: 0.8105   	|  max: 0.8516   [0m
[32m2022-07-06 12:30:40[0m | [1mINFO    [0m | [1mlr:	| avg: 0.0001283	|  std: nan      	|  min: 0.0001283	|  25%: 0.0001283	|  50%: 0.0001283	|  75%: 0.0001283	|  max: 0.0001283[0m
[32m2022-07-06 12:30:40[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:30:40[0m | [1mINFO    [0m | [1mloss:	| avg: 796.5    	|  std: 72.07    	|  min: 728.0    	|  25%: 744.4    	|  50%: 766.5    	|  75%: 820.0    	|  max: 978.5    [0m
[32m2022-07-06 12:30:40[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]

train:   0%|          | 0/73 [00:00<?, ?it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  4.96it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  4.96it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  4.95it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  4.95it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 37.35it/s]


[32m2022-07-06 12:30:56[0m | [1mINFO    [0m | [1mFinished epoch 10/40:[0m
[32m2022-07-06 12:30:56[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:30:56[0m | [1mINFO    [0m | [1mloss:	| avg: 727.3    	|  std: 42.68    	|  min: 641.0    	|  25%: 704.0    	|  50%: 726.0    	|  75%: 757.0    	|  max: 845.0    [0m
[32m2022-07-06 12:30:56[0m | [1mINFO    [0m | [1macc:	| avg: 0.802    	|  std: 0.03386  	|  min: 0.6953   	|  25%: 0.7832   	|  50%: 0.8047   	|  75%: 0.8242   	|  max: 0.8652   [0m
[32m2022-07-06 12:30:56[0m | [1mINFO    [0m | [1mlr:	| avg: 0.0001426	|  std: nan      	|  min: 0.0001426	|  25%: 0.0001426	|  50%: 0.0001426	|  75%: 0.0001426	|  max: 0.0001426[0m
[32m2022-07-06 12:30:56[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:30:56[0m | [1mINFO    [0m | [1mloss:	| avg: 778.2    	|  std: 56.57    	|  min: 721.5    	|  25%: 740.1    	|  50%: 759.2    	|  75%: 790.1    	|  max: 898.0    [0m
[32m2022-07-06 12:30:56[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]

train:   0%|          | 0/73 [00:00<?, ?it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  4.95it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  4.95it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  4.95it/s]
validation:   0%|          | 0/22 [00:00<?, ?it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 37.41it/s]


[32m2022-07-06 12:31:13[0m | [1mINFO    [0m | [1mFinished epoch 11/40:[0m
[32m2022-07-06 12:31:13[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:31:13[0m | [1mINFO    [0m | [1mloss:	| avg: 710.3    	|  std: 44.0     	|  min: 631.0    	|  25%: 675.0    	|  50%: 703.0    	|  75%: 737.0    	|  max: 829.5    [0m
[32m2022-07-06 12:31:13[0m | [1mINFO    [0m | [1macc:	| avg: 0.8194   	|  std: 0.02619  	|  min: 0.7441   	|  25%: 0.8008   	|  50%: 0.8223   	|  75%: 0.8379   	|  max: 0.8691   [0m
[32m2022-07-06 12:31:13[0m | [1mINFO    [0m | [1mlr:	| avg: 0.0001568	|  std: nan      	|  min: 0.0001568	|  25%: 0.0001568	|  50%: 0.0001568	|  75%: 0.0001568	|  max: 0.0001568[0m
[32m2022-07-06 12:31:13[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:31:13[0m | [1mINFO    [0m | [1mloss:	| avg: 788.7    	|  std: 58.93    	|  min: 708.0    	|  25%: 749.6    	|  50%: 778.0    	|  75%: 829.1    	|  max: 908.0    [0m
[32m2022-07-06 12:31:13[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]

train:   0%|          | 0/73 [00:00<?, ?it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.02it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.02it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.02it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.02it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 36.99it/s]


[32m2022-07-06 12:31:28[0m | [1mINFO    [0m | [1mFinished epoch 12/40:[0m
[32m2022-07-06 12:31:28[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:31:28[0m | [1mINFO    [0m | [1mloss:	| avg: 703.3    	|  std: 40.33    	|  min: 624.0    	|  25%: 671.5    	|  50%: 701.5    	|  75%: 732.0    	|  max: 802.0    [0m
[32m2022-07-06 12:31:28[0m | [1mINFO    [0m | [1macc:	| avg: 0.8301   	|  std: 0.02834  	|  min: 0.7734   	|  25%: 0.8086   	|  50%: 0.8301   	|  75%: 0.8477   	|  max: 0.9102   [0m
[32m2022-07-06 12:31:28[0m | [1mINFO    [0m | [1mlr:	| avg: 0.0001711	|  std: nan      	|  min: 0.0001711	|  25%: 0.0001711	|  50%: 0.0001711	|  75%: 0.0001711	|  max: 0.0001711[0m
[32m2022-07-06 12:31:28[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:31:28[0m | [1mINFO    [0m | [1mloss:	| avg: 779.7    	|  std: 70.39    	|  min: 706.0    	|  25%: 736.0    	|  50%: 751.5    	|  75%: 827.0    	|  max: 969.0    [0m
[32m2022-07-06 12:31:28[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]

train:   0%|          | 0/73 [00:00<?, ?it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.06it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.06it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.05it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.05it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 37.34it/s]


[32m2022-07-06 12:31:44[0m | [1mINFO    [0m | [1mFinished epoch 13/40:[0m
[32m2022-07-06 12:31:44[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:31:44[0m | [1mINFO    [0m | [1mloss:	| avg: 698.1    	|  std: 43.73    	|  min: 628.0    	|  25%: 666.5    	|  50%: 689.0    	|  75%: 722.0    	|  max: 832.5    [0m
[32m2022-07-06 12:31:44[0m | [1mINFO    [0m | [1macc:	| avg: 0.8443   	|  std: 0.02363  	|  min: 0.7852   	|  25%: 0.8262   	|  50%: 0.8477   	|  75%: 0.8594   	|  max: 0.8926   [0m
[32m2022-07-06 12:31:44[0m | [1mINFO    [0m | [1mlr:	| avg: 0.0001854	|  std: nan      	|  min: 0.0001854	|  25%: 0.0001854	|  50%: 0.0001854	|  75%: 0.0001854	|  max: 0.0001854[0m
[32m2022-07-06 12:31:44[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:31:44[0m | [1mINFO    [0m | [1mloss:	| avg: 711.8    	|  std: 29.01    	|  min: 649.0    	|  25%: 696.1    	|  50%: 716.0    	|  75%: 721.8    	|  max: 783.0    [0m
[32m2022-07-06 12:31:44[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]


train: 100%|██████████| 73/73 [00:14<00:00,  5.05it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.04it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.04it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.04it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 37.28it/s]


[32m2022-07-06 12:32:00[0m | [1mINFO    [0m | [1mFinished epoch 14/40:[0m
[32m2022-07-06 12:32:00[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:32:00[0m | [1mINFO    [0m | [1mloss:	| avg: 686.0    	|  std: 45.49    	|  min: 600.5    	|  25%: 654.0    	|  50%: 678.0    	|  75%: 710.5    	|  max: 804.5    [0m
[32m2022-07-06 12:32:00[0m | [1mINFO    [0m | [1macc:	| avg: 0.8602   	|  std: 0.02515  	|  min: 0.7617   	|  25%: 0.8457   	|  50%: 0.8594   	|  75%: 0.877    	|  max: 0.9082   [0m
[32m2022-07-06 12:32:00[0m | [1mINFO    [0m | [1mlr:	| avg: 0.0001996	|  std: nan      	|  min: 0.0001996	|  25%: 0.0001996	|  50%: 0.0001996	|  75%: 0.0001996	|  max: 0.0001996[0m
[32m2022-07-06 12:32:00[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:32:00[0m | [1mINFO    [0m | [1mloss:	| avg: 663.7    	|  std: 49.56    	|  min: 624.0    	|  25%: 638.6    	|  50%: 645.0    	|  75%: 656.2    	|  max: 811.5    [0m
[32m2022-07-06 12:32:00[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]


train: 100%|██████████| 73/73 [00:14<00:00,  5.07it/s]
validation:   0%|          | 0/22 [00:00<?, ?it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.07it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.06it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 36.33it/s]


[32m2022-07-06 12:32:16[0m | [1mINFO    [0m | [1mFinished epoch 15/40:[0m
[32m2022-07-06 12:32:16[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:32:16[0m | [1mINFO    [0m | [1mloss:	| avg: 631.0    	|  std: 39.36    	|  min: 556.0    	|  25%: 604.0    	|  50%: 628.0    	|  75%: 658.0    	|  max: 719.0    [0m
[32m2022-07-06 12:32:16[0m | [1mINFO    [0m | [1macc:	| avg: 0.8925   	|  std: 0.02382  	|  min: 0.8262   	|  25%: 0.877    	|  50%: 0.8965   	|  75%: 0.9102   	|  max: 0.9316   [0m
[32m2022-07-06 12:32:16[0m | [1mINFO    [0m | [1mlr:	| avg: 0.0001928	|  std: nan      	|  min: 0.0001928	|  25%: 0.0001928	|  50%: 0.0001928	|  75%: 0.0001928	|  max: 0.0001928[0m
[32m2022-07-06 12:32:16[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:32:16[0m | [1mINFO    [0m | [1mloss:	| avg: 618.2    	|  std: 29.49    	|  min: 587.0    	|  25%: 601.2    	|  50%: 606.8    	|  75%: 630.5    	|  max: 700.0    [0m
[32m2022-07-06 12:32:16[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]


train: 100%|██████████| 73/73 [00:14<00:00,  5.07it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.07it/s]

train: 100%|██████████| 73/73 [00:14<00:00,  5.07it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 37.64it/s]


[32m2022-07-06 12:32:32[0m | [1mINFO    [0m | [1mFinished epoch 16/40:[0m
[32m2022-07-06 12:32:32[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:32:32[0m | [1mINFO    [0m | [1mloss:	| avg: 580.3    	|  std: 26.2     	|  min: 541.0    	|  25%: 561.0    	|  50%: 578.0    	|  75%: 596.0    	|  max: 657.0    [0m
[32m2022-07-06 12:32:32[0m | [1mINFO    [0m | [1macc:	| avg: 0.9257   	|  std: 0.01752  	|  min: 0.8867   	|  25%: 0.9141   	|  50%: 0.9277   	|  75%: 0.9395   	|  max: 0.957    [0m
[32m2022-07-06 12:32:32[0m | [1mINFO    [0m | [1mlr:	| avg: 0.0001854	|  std: nan      	|  min: 0.0001854	|  25%: 0.0001854	|  50%: 0.0001854	|  75%: 0.0001854	|  max: 0.0001854[0m
[32m2022-07-06 12:32:32[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:32:32[0m | [1mINFO    [0m | [1mloss:	| avg: 657.2    	|  std: 92.77    	|  min: 611.5    	|  25%: 616.8    	|  50%: 630.5    	|  75%: 650.8    	|  max: 1.05e+03 [0m
[32m2022-07-06 12:32:32[0m | 



train:   0%|          | 0/73 [00:00<?, ?it/s]

train: 100%|██████████| 73/73 [00:14<00:00,  5.10it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.10it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.10it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.10it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 37.71it/s]


[32m2022-07-06 12:32:47[0m | [1mINFO    [0m | [1mFinished epoch 17/40:[0m
[32m2022-07-06 12:32:47[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:32:47[0m | [1mINFO    [0m | [1mloss:	| avg: 558.7    	|  std: 19.0     	|  min: 525.0    	|  25%: 546.5    	|  50%: 557.0    	|  75%: 569.0    	|  max: 616.0    [0m
[32m2022-07-06 12:32:47[0m | [1mINFO    [0m | [1macc:	| avg: 0.9398   	|  std: 0.01474  	|  min: 0.8887   	|  25%: 0.9336   	|  50%: 0.9414   	|  75%: 0.9492   	|  max: 0.9648   [0m
[32m2022-07-06 12:32:47[0m | [1mINFO    [0m | [1mlr:	| avg: 0.000178 	|  std: nan      	|  min: 0.000178 	|  25%: 0.000178 	|  50%: 0.000178 	|  75%: 0.000178 	|  max: 0.000178 [0m
[32m2022-07-06 12:32:47[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:32:47[0m | [1mINFO    [0m | [1mloss:	| avg: 605.8    	|  std: 24.72    	|  min: 577.0    	|  25%: 592.6    	|  50%: 596.0    	|  75%: 611.6    	|  max: 670.0    [0m
[32m2022-07-06 12:32:47[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]
train:   0%|          | 0/73 [00:00<?, ?it/s]

train: 100%|██████████| 73/73 [00:14<00:00,  5.08it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.08it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.07it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.07it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 37.45it/s]


[32m2022-07-06 12:33:03[0m | [1mINFO    [0m | [1mFinished epoch 18/40:[0m
[32m2022-07-06 12:33:03[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:33:03[0m | [1mINFO    [0m | [1mloss:	| avg: 536.4    	|  std: 15.69    	|  min: 508.5    	|  25%: 527.0    	|  50%: 534.0    	|  75%: 545.0    	|  max: 604.0    [0m
[32m2022-07-06 12:33:03[0m | [1mINFO    [0m | [1macc:	| avg: 0.9533   	|  std: 0.01314  	|  min: 0.9199   	|  25%: 0.9453   	|  50%: 0.9531   	|  75%: 0.9629   	|  max: 0.9844   [0m
[32m2022-07-06 12:33:03[0m | [1mINFO    [0m | [1mlr:	| avg: 0.0001706	|  std: nan      	|  min: 0.0001706	|  25%: 0.0001706	|  50%: 0.0001706	|  75%: 0.0001706	|  max: 0.0001706[0m
[32m2022-07-06 12:33:03[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:33:03[0m | [1mINFO    [0m | [1mloss:	| avg: 573.6    	|  std: 16.06    	|  min: 550.0    	|  25%: 564.2    	|  50%: 572.5    	|  75%: 580.0    	|  max: 628.0    [0m
[32m2022-07-06 12:33:03[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]
train:   0%|          | 0/73 [00:00<?, ?it/s]

train: 100%|██████████| 73/73 [00:14<00:00,  5.13it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.13it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.13it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.13it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 37.52it/s]


[32m2022-07-06 12:33:19[0m | [1mINFO    [0m | [1mFinished epoch 19/40:[0m
[32m2022-07-06 12:33:19[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:33:19[0m | [1mINFO    [0m | [1mloss:	| avg: 521.4    	|  std: 14.52    	|  min: 498.5    	|  25%: 511.0    	|  50%: 518.0    	|  75%: 527.0    	|  max: 571.5    [0m
[32m2022-07-06 12:33:19[0m | [1mINFO    [0m | [1macc:	| avg: 0.9636   	|  std: 0.01295  	|  min: 0.9297   	|  25%: 0.9551   	|  50%: 0.9668   	|  75%: 0.9727   	|  max: 0.9863   [0m
[32m2022-07-06 12:33:19[0m | [1mINFO    [0m | [1mlr:	| avg: 0.0001633	|  std: nan      	|  min: 0.0001633	|  25%: 0.0001633	|  50%: 0.0001633	|  75%: 0.0001633	|  max: 0.0001633[0m
[32m2022-07-06 12:33:19[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:33:19[0m | [1mINFO    [0m | [1mloss:	| avg: 606.6    	|  std: 31.4     	|  min: 574.0    	|  25%: 583.5    	|  50%: 599.0    	|  75%: 616.5    	|  max: 685.0    [0m
[32m2022-07-06 12:33:19[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]
train:   0%|          | 0/73 [00:00<?, ?it/s]

train: 100%|██████████| 73/73 [00:14<00:00,  5.13it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.13it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.13it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.13it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 37.48it/s]


[32m2022-07-06 12:33:34[0m | [1mINFO    [0m | [1mFinished epoch 20/40:[0m
[32m2022-07-06 12:33:34[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:33:34[0m | [1mINFO    [0m | [1mloss:	| avg: 509.0    	|  std: 14.28    	|  min: 491.2    	|  25%: 499.0    	|  50%: 506.2    	|  75%: 515.0    	|  max: 555.0    [0m
[32m2022-07-06 12:33:34[0m | [1mINFO    [0m | [1macc:	| avg: 0.9722   	|  std: 0.01407  	|  min: 0.9199   	|  25%: 0.9668   	|  50%: 0.9727   	|  75%: 0.9805   	|  max: 0.9961   [0m
[32m2022-07-06 12:33:34[0m | [1mINFO    [0m | [1mlr:	| avg: 0.0001559	|  std: nan      	|  min: 0.0001559	|  25%: 0.0001559	|  50%: 0.0001559	|  75%: 0.0001559	|  max: 0.0001559[0m
[32m2022-07-06 12:33:34[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:33:34[0m | [1mINFO    [0m | [1mloss:	| avg: 564.4    	|  std: 14.26    	|  min: 550.0    	|  25%: 554.0    	|  50%: 559.0    	|  75%: 571.0    	|  max: 602.0    [0m
[32m2022-07-06 12:33:34[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]
train:   0%|          | 0/73 [00:00<?, ?it/s]

train: 100%|██████████| 73/73 [00:14<00:00,  5.17it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.17it/s]
validation:   0%|          | 0/22 [00:00<?, ?it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.17it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 37.39it/s]


[32m2022-07-06 12:33:50[0m | [1mINFO    [0m | [1mFinished epoch 21/40:[0m
[32m2022-07-06 12:33:50[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:33:50[0m | [1mINFO    [0m | [1mloss:	| avg: 500.3    	|  std: 9.966    	|  min: 479.8    	|  25%: 494.2    	|  50%: 499.5    	|  75%: 505.5    	|  max: 532.0    [0m
[32m2022-07-06 12:33:50[0m | [1mINFO    [0m | [1macc:	| avg: 0.9782   	|  std: 0.008721 	|  min: 0.9512   	|  25%: 0.9727   	|  50%: 0.9785   	|  75%: 0.9844   	|  max: 0.9922   [0m
[32m2022-07-06 12:33:50[0m | [1mINFO    [0m | [1mlr:	| avg: 0.0001485	|  std: nan      	|  min: 0.0001485	|  25%: 0.0001485	|  50%: 0.0001485	|  75%: 0.0001485	|  max: 0.0001485[0m
[32m2022-07-06 12:33:50[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:33:50[0m | [1mINFO    [0m | [1mloss:	| avg: 569.6    	|  std: 31.02    	|  min: 537.5    	|  25%: 553.2    	|  50%: 561.5    	|  75%: 574.8    	|  max: 684.0    [0m
[32m2022-07-06 12:33:50[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]

train:   0%|          | 0/73 [00:00<?, ?it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.13it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.13it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.13it/s]

validation: 100%|██████████| 22/22 [00:00<00:00, 37.43it/s]


[32m2022-07-06 12:34:05[0m | [1mINFO    [0m | [1mFinished epoch 22/40:[0m
[32m2022-07-06 12:34:05[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:34:05[0m | [1mINFO    [0m | [1mloss:	| avg: 487.7    	|  std: 6.198    	|  min: 474.0    	|  25%: 484.5    	|  50%: 487.2    	|  75%: 491.5    	|  max: 505.5    [0m
[32m2022-07-06 12:34:05[0m | [1mINFO    [0m | [1macc:	| avg: 0.9871   	|  std: 0.005812 	|  min: 0.9727   	|  25%: 0.9824   	|  50%: 0.9883   	|  75%: 0.9902   	|  max: 0.998    [0m
[32m2022-07-06 12:34:05[0m | [1mINFO    [0m | [1mlr:	| avg: 0.0001411	|  std: nan      	|  min: 0.0001411	|  25%: 0.0001411	|  50%: 0.0001411	|  75%: 0.0001411	|  max: 0.0001411[0m
[32m2022-07-06 12:34:05[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:34:05[0m | [1mINFO    [0m | [1mloss:	| avg: 561.6    	|  std: 18.72    	|  min: 534.0    	|  25%: 550.2    	|  50%: 556.2    	|  75%: 568.9    	|  max: 613.0    [0m
[32m2022-07-06 12:34:05[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]

train:   0%|          | 0/73 [00:00<?, ?it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.15it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.15it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.15it/s]
validation:   0%|          | 0/22 [00:00<?, ?it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 36.41it/s]


[32m2022-07-06 12:34:21[0m | [1mINFO    [0m | [1mFinished epoch 23/40:[0m
[32m2022-07-06 12:34:21[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:34:21[0m | [1mINFO    [0m | [1mloss:	| avg: 483.4    	|  std: 7.927    	|  min: 473.2    	|  25%: 478.0    	|  50%: 481.0    	|  75%: 487.5    	|  max: 509.5    [0m
[32m2022-07-06 12:34:21[0m | [1mINFO    [0m | [1macc:	| avg: 0.9886   	|  std: 0.00623  	|  min: 0.9688   	|  25%: 0.9863   	|  50%: 0.9902   	|  75%: 0.9922   	|  max: 0.998    [0m
[32m2022-07-06 12:34:21[0m | [1mINFO    [0m | [1mlr:	| avg: 0.0001337	|  std: nan      	|  min: 0.0001337	|  25%: 0.0001337	|  50%: 0.0001337	|  75%: 0.0001337	|  max: 0.0001337[0m
[32m2022-07-06 12:34:21[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:34:21[0m | [1mINFO    [0m | [1mloss:	| avg: 552.4    	|  std: 12.89    	|  min: 533.5    	|  25%: 543.6    	|  50%: 550.5    	|  75%: 558.4    	|  max: 585.0    [0m
[32m2022-07-06 12:34:21[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]
train:   0%|          | 0/73 [00:00<?, ?it/s]

train: 100%|██████████| 73/73 [00:14<00:00,  5.13it/s]
validation:   0%|          | 0/22 [00:00<?, ?it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.13it/s]

validation: 100%|██████████| 22/22 [00:00<00:00, 37.92it/s]


[32m2022-07-06 12:34:37[0m | [1mINFO    [0m | [1mFinished epoch 24/40:[0m
[32m2022-07-06 12:34:37[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:34:37[0m | [1mINFO    [0m | [1mloss:	| avg: 478.8    	|  std: 7.406    	|  min: 467.2    	|  25%: 474.2    	|  50%: 476.8    	|  75%: 482.0    	|  max: 501.0    [0m
[32m2022-07-06 12:34:37[0m | [1mINFO    [0m | [1macc:	| avg: 0.9894   	|  std: 0.006403 	|  min: 0.9668   	|  25%: 0.9863   	|  50%: 0.9922   	|  75%: 0.9941   	|  max: 0.998    [0m
[32m2022-07-06 12:34:37[0m | [1mINFO    [0m | [1mlr:	| avg: 0.0001263	|  std: nan      	|  min: 0.0001263	|  25%: 0.0001263	|  50%: 0.0001263	|  75%: 0.0001263	|  max: 0.0001263[0m
[32m2022-07-06 12:34:37[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:34:37[0m | [1mINFO    [0m | [1mloss:	| avg: 556.0    	|  std: 20.18    	|  min: 534.0    	|  25%: 542.2    	|  50%: 549.0    	|  75%: 564.8    	|  max: 604.5    [0m
[32m2022-07-06 12:34:37[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]

train:   0%|          | 0/73 [00:00<?, ?it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.12it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.12it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.12it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.12it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 37.19it/s]


[32m2022-07-06 12:34:52[0m | [1mINFO    [0m | [1mFinished epoch 25/40:[0m
[32m2022-07-06 12:34:52[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:34:52[0m | [1mINFO    [0m | [1mloss:	| avg: 473.3    	|  std: 5.483    	|  min: 464.2    	|  25%: 469.0    	|  50%: 472.0    	|  75%: 477.5    	|  max: 484.2    [0m
[32m2022-07-06 12:34:52[0m | [1mINFO    [0m | [1macc:	| avg: 0.9929   	|  std: 0.005321 	|  min: 0.9785   	|  25%: 0.9902   	|  50%: 0.9941   	|  75%: 0.9961   	|  max: 1.0      [0m
[32m2022-07-06 12:34:52[0m | [1mINFO    [0m | [1mlr:	| avg: 0.0001189	|  std: nan      	|  min: 0.0001189	|  25%: 0.0001189	|  50%: 0.0001189	|  75%: 0.0001189	|  max: 0.0001189[0m
[32m2022-07-06 12:34:52[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:34:52[0m | [1mINFO    [0m | [1mloss:	| avg: 549.6    	|  std: 15.75    	|  min: 532.5    	|  25%: 541.5    	|  50%: 545.2    	|  75%: 549.9    	|  max: 600.0    [0m
[32m2022-07-06 12:34:52[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]


train: 100%|██████████| 73/73 [00:14<00:00,  5.13it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.13it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.13it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.13it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 37.18it/s]


[32m2022-07-06 12:35:08[0m | [1mINFO    [0m | [1mFinished epoch 26/40:[0m
[32m2022-07-06 12:35:08[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:35:08[0m | [1mINFO    [0m | [1mloss:	| avg: 469.6    	|  std: 5.291    	|  min: 462.2    	|  25%: 466.0    	|  50%: 468.0    	|  75%: 472.0    	|  max: 487.8    [0m
[32m2022-07-06 12:35:08[0m | [1mINFO    [0m | [1macc:	| avg: 0.9946   	|  std: 0.00422  	|  min: 0.9785   	|  25%: 0.9922   	|  50%: 0.9961   	|  75%: 0.998    	|  max: 1.0      [0m
[32m2022-07-06 12:35:08[0m | [1mINFO    [0m | [1mlr:	| avg: 0.0001115	|  std: nan      	|  min: 0.0001115	|  25%: 0.0001115	|  50%: 0.0001115	|  75%: 0.0001115	|  max: 0.0001115[0m
[32m2022-07-06 12:35:08[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:35:08[0m | [1mINFO    [0m | [1mloss:	| avg: 554.2    	|  std: 17.82    	|  min: 527.5    	|  25%: 544.0    	|  50%: 551.2    	|  75%: 559.4    	|  max: 617.0    [0m
[32m2022-07-06 12:35:08[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]


train: 100%|██████████| 73/73 [00:14<00:00,  5.13it/s]

validation:   0%|          | 0/22 [00:00<?, ?it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.13it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 36.77it/s]


[32m2022-07-06 12:35:23[0m | [1mINFO    [0m | [1mFinished epoch 27/40:[0m
[32m2022-07-06 12:35:23[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:35:23[0m | [1mINFO    [0m | [1mloss:	| avg: 468.2    	|  std: 5.876    	|  min: 461.5    	|  25%: 463.5    	|  50%: 466.5    	|  75%: 472.0    	|  max: 489.5    [0m
[32m2022-07-06 12:35:23[0m | [1mINFO    [0m | [1macc:	| avg: 0.9945   	|  std: 0.004872 	|  min: 0.9746   	|  25%: 0.9922   	|  50%: 0.9961   	|  75%: 0.998    	|  max: 1.0      [0m
[32m2022-07-06 12:35:23[0m | [1mINFO    [0m | [1mlr:	| avg: 0.0001041	|  std: nan      	|  min: 0.0001041	|  25%: 0.0001041	|  50%: 0.0001041	|  75%: 0.0001041	|  max: 0.0001041[0m
[32m2022-07-06 12:35:23[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:35:23[0m | [1mINFO    [0m | [1mloss:	| avg: 556.0    	|  std: 19.63    	|  min: 530.5    	|  25%: 544.5    	|  50%: 550.0    	|  75%: 565.1    	|  max: 619.0    [0m
[32m2022-07-06 12:35:23[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]
train:   0%|          | 0/73 [00:00<?, ?it/s]

train: 100%|██████████| 73/73 [00:14<00:00,  5.10it/s]
validation:   0%|          | 0/22 [00:00<?, ?it/s]

train: 100%|██████████| 73/73 [00:14<00:00,  5.10it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 37.77it/s]


[32m2022-07-06 12:35:39[0m | [1mINFO    [0m | [1mFinished epoch 28/40:[0m
[32m2022-07-06 12:35:39[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:35:39[0m | [1mINFO    [0m | [1mloss:	| avg: 465.4    	|  std: 4.304    	|  min: 459.0    	|  25%: 462.0    	|  50%: 464.5    	|  75%: 468.0    	|  max: 481.0    [0m
[32m2022-07-06 12:35:39[0m | [1mINFO    [0m | [1macc:	| avg: 0.9956   	|  std: 0.003371 	|  min: 0.9824   	|  25%: 0.9941   	|  50%: 0.9961   	|  75%: 0.998    	|  max: 1.0      [0m
[32m2022-07-06 12:35:39[0m | [1mINFO    [0m | [1mlr:	| avg: 9.676e-05	|  std: nan      	|  min: 9.676e-05	|  25%: 9.676e-05	|  50%: 9.676e-05	|  75%: 9.676e-05	|  max: 9.676e-05[0m
[32m2022-07-06 12:35:39[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:35:39[0m | [1mINFO    [0m | [1mloss:	| avg: 550.8    	|  std: 13.6     	|  min: 530.0    	|  25%: 542.6    	|  50%: 548.5    	|  75%: 558.1    	|  max: 585.0    [0m
[32m2022-07-06 12:35:39[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]
train:   0%|          | 0/73 [00:00<?, ?it/s]

train: 100%|██████████| 73/73 [00:14<00:00,  5.12it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.12it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.12it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.12it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 37.44it/s]


[32m2022-07-06 12:35:55[0m | [1mINFO    [0m | [1mFinished epoch 29/40:[0m
[32m2022-07-06 12:35:55[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:35:55[0m | [1mINFO    [0m | [1mloss:	| avg: 463.7    	|  std: 4.196    	|  min: 457.8    	|  25%: 460.5    	|  50%: 462.5    	|  75%: 466.0    	|  max: 479.0    [0m
[32m2022-07-06 12:35:55[0m | [1mINFO    [0m | [1macc:	| avg: 0.9964   	|  std: 0.003277 	|  min: 0.9863   	|  25%: 0.9961   	|  50%: 0.9961   	|  75%: 0.998    	|  max: 1.0      [0m
[32m2022-07-06 12:35:55[0m | [1mINFO    [0m | [1mlr:	| avg: 8.937e-05	|  std: nan      	|  min: 8.937e-05	|  25%: 8.937e-05	|  50%: 8.937e-05	|  75%: 8.937e-05	|  max: 8.937e-05[0m
[32m2022-07-06 12:35:55[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:35:55[0m | [1mINFO    [0m | [1mloss:	| avg: 546.4    	|  std: 11.11    	|  min: 524.5    	|  25%: 540.5    	|  50%: 546.8    	|  75%: 552.5    	|  max: 572.0    [0m
[32m2022-07-06 12:35:55[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]


train: 100%|██████████| 73/73 [00:14<00:00,  5.12it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.12it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.12it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.12it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 37.26it/s]


[32m2022-07-06 12:36:10[0m | [1mINFO    [0m | [1mFinished epoch 30/40:[0m
[32m2022-07-06 12:36:10[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:36:10[0m | [1mINFO    [0m | [1mloss:	| avg: 460.9    	|  std: 3.798    	|  min: 455.8    	|  25%: 458.0    	|  50%: 459.8    	|  75%: 462.8    	|  max: 472.0    [0m
[32m2022-07-06 12:36:10[0m | [1mINFO    [0m | [1macc:	| avg: 0.9975   	|  std: 0.00334  	|  min: 0.9844   	|  25%: 0.9961   	|  50%: 0.998    	|  75%: 1.0      	|  max: 1.0      [0m
[32m2022-07-06 12:36:10[0m | [1mINFO    [0m | [1mlr:	| avg: 8.198e-05	|  std: nan      	|  min: 8.198e-05	|  25%: 8.198e-05	|  50%: 8.198e-05	|  75%: 8.198e-05	|  max: 8.198e-05[0m
[32m2022-07-06 12:36:10[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:36:10[0m | [1mINFO    [0m | [1mloss:	| avg: 547.1    	|  std: 10.37    	|  min: 529.0    	|  25%: 544.5    	|  50%: 547.5    	|  75%: 550.8    	|  max: 570.0    [0m
[32m2022-07-06 12:36:10[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]
train:   0%|          | 0/73 [00:00<?, ?it/s]
train:   0%|          | 0/73 [00:00<?, ?it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.14it/s]
validation:   0%|          | 0/22 [00:00<?, ?it/s]t/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.14it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.13it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 36.46it/s]


[32m2022-07-06 12:36:26[0m | [1mINFO    [0m | [1mFinished epoch 31/40:[0m
[32m2022-07-06 12:36:26[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:36:26[0m | [1mINFO    [0m | [1mloss:	| avg: 459.9    	|  std: 3.504    	|  min: 454.5    	|  25%: 457.5    	|  50%: 459.0    	|  75%: 462.0    	|  max: 469.5    [0m
[32m2022-07-06 12:36:26[0m | [1mINFO    [0m | [1macc:	| avg: 0.9974   	|  std: 0.00302  	|  min: 0.9883   	|  25%: 0.9961   	|  50%: 0.998    	|  75%: 1.0      	|  max: 1.0      [0m
[32m2022-07-06 12:36:26[0m | [1mINFO    [0m | [1mlr:	| avg: 7.46e-05 	|  std: nan      	|  min: 7.46e-05 	|  25%: 7.46e-05 	|  50%: 7.46e-05 	|  75%: 7.46e-05 	|  max: 7.46e-05 [0m
[32m2022-07-06 12:36:26[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:36:26[0m | [1mINFO    [0m | [1mloss:	| avg: 540.7    	|  std: 13.5     	|  min: 512.5    	|  25%: 531.4    	|  50%: 540.8    	|  75%: 546.8    	|  max: 569.0    [0m
[32m2022-07-06 12:36:26[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]

train:   0%|          | 0/73 [00:00<?, ?it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.13it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.13it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.13it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.13it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 37.69it/s]


[32m2022-07-06 12:36:41[0m | [1mINFO    [0m | [1mFinished epoch 32/40:[0m
[32m2022-07-06 12:36:41[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:36:41[0m | [1mINFO    [0m | [1mloss:	| avg: 458.9    	|  std: 3.523    	|  min: 453.5    	|  25%: 456.5    	|  50%: 458.0    	|  75%: 461.0    	|  max: 470.0    [0m
[32m2022-07-06 12:36:41[0m | [1mINFO    [0m | [1macc:	| avg: 0.9981   	|  std: 0.00249  	|  min: 0.9883   	|  25%: 0.998    	|  50%: 0.998    	|  75%: 1.0      	|  max: 1.0      [0m
[32m2022-07-06 12:36:42[0m | [1mINFO    [0m | [1mlr:	| avg: 6.721e-05	|  std: nan      	|  min: 6.721e-05	|  25%: 6.721e-05	|  50%: 6.721e-05	|  75%: 6.721e-05	|  max: 6.721e-05[0m
[32m2022-07-06 12:36:42[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:36:42[0m | [1mINFO    [0m | [1mloss:	| avg: 543.9    	|  std: 10.31    	|  min: 526.0    	|  25%: 537.0    	|  50%: 543.0    	|  75%: 552.5    	|  max: 563.0    [0m
[32m2022-07-06 12:36:42[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]

train:   0%|          | 0/73 [00:00<?, ?it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.11it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.11it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.11it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.11it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 37.77it/s]


[32m2022-07-06 12:36:57[0m | [1mINFO    [0m | [1mFinished epoch 33/40:[0m
[32m2022-07-06 12:36:57[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:36:57[0m | [1mINFO    [0m | [1mloss:	| avg: 458.2    	|  std: 3.432    	|  min: 453.2    	|  25%: 455.5    	|  50%: 457.2    	|  75%: 460.2    	|  max: 468.8    [0m
[32m2022-07-06 12:36:57[0m | [1mINFO    [0m | [1macc:	| avg: 0.998    	|  std: 0.002584 	|  min: 0.9883   	|  25%: 0.9961   	|  50%: 1.0      	|  75%: 1.0      	|  max: 1.0      [0m
[32m2022-07-06 12:36:57[0m | [1mINFO    [0m | [1mlr:	| avg: 5.982e-05	|  std: nan      	|  min: 5.982e-05	|  25%: 5.982e-05	|  50%: 5.982e-05	|  75%: 5.982e-05	|  max: 5.982e-05[0m
[32m2022-07-06 12:36:57[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:36:57[0m | [1mINFO    [0m | [1mloss:	| avg: 542.1    	|  std: 8.353    	|  min: 524.0    	|  25%: 537.5    	|  50%: 542.0    	|  75%: 546.9    	|  max: 561.5    [0m
[32m2022-07-06 12:36:57[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]

train:   0%|          | 0/73 [00:00<?, ?it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.15it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.15it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.15it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.15it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 37.65it/s]


[32m2022-07-06 12:37:13[0m | [1mINFO    [0m | [1mFinished epoch 34/40:[0m
[32m2022-07-06 12:37:13[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:37:13[0m | [1mINFO    [0m | [1mloss:	| avg: 456.7    	|  std: 2.676    	|  min: 453.2    	|  25%: 454.5    	|  50%: 456.0    	|  75%: 458.8    	|  max: 463.5    [0m
[32m2022-07-06 12:37:13[0m | [1mINFO    [0m | [1macc:	| avg: 0.9986   	|  std: 0.002097 	|  min: 0.9883   	|  25%: 0.998    	|  50%: 1.0      	|  75%: 1.0      	|  max: 1.0      [0m
[32m2022-07-06 12:37:13[0m | [1mINFO    [0m | [1mlr:	| avg: 5.243e-05	|  std: nan      	|  min: 5.243e-05	|  25%: 5.243e-05	|  50%: 5.243e-05	|  75%: 5.243e-05	|  max: 5.243e-05[0m
[32m2022-07-06 12:37:13[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:37:13[0m | [1mINFO    [0m | [1mloss:	| avg: 540.3    	|  std: 9.162    	|  min: 526.5    	|  25%: 533.5    	|  50%: 539.2    	|  75%: 546.0    	|  max: 558.0    [0m
[32m2022-07-06 12:37:13[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]

train:   0%|          | 0/73 [00:00<?, ?it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.19it/s]
validation:   0%|          | 0/22 [00:00<?, ?it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.18it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.18it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 37.82it/s]


[32m2022-07-06 12:37:28[0m | [1mINFO    [0m | [1mFinished epoch 35/40:[0m
[32m2022-07-06 12:37:28[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:37:28[0m | [1mINFO    [0m | [1mloss:	| avg: 456.3    	|  std: 2.89     	|  min: 452.8    	|  25%: 454.2    	|  50%: 455.8    	|  75%: 457.5    	|  max: 467.0    [0m
[32m2022-07-06 12:37:28[0m | [1mINFO    [0m | [1macc:	| avg: 0.9986   	|  std: 0.00204  	|  min: 0.9902   	|  25%: 0.998    	|  50%: 1.0      	|  75%: 1.0      	|  max: 1.0      [0m
[32m2022-07-06 12:37:28[0m | [1mINFO    [0m | [1mlr:	| avg: 5e-05    	|  std: nan      	|  min: 5e-05    	|  25%: 5e-05    	|  50%: 5e-05    	|  75%: 5e-05    	|  max: 5e-05    [0m
[32m2022-07-06 12:37:28[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:37:28[0m | [1mINFO    [0m | [1mloss:	| avg: 539.9    	|  std: 11.75    	|  min: 511.0    	|  25%: 531.1    	|  50%: 541.0    	|  75%: 546.9    	|  max: 559.5    [0m
[32m2022-07-06 12:37:28[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]


train: 100%|██████████| 73/73 [00:14<00:00,  5.17it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.17it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.16it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.16it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 36.85it/s]


[32m2022-07-06 12:37:44[0m | [1mINFO    [0m | [1mFinished epoch 36/40:[0m
[32m2022-07-06 12:37:44[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:37:44[0m | [1mINFO    [0m | [1mloss:	| avg: 455.7    	|  std: 2.554    	|  min: 452.2    	|  25%: 453.8    	|  50%: 455.0    	|  75%: 457.0    	|  max: 463.0    [0m
[32m2022-07-06 12:37:44[0m | [1mINFO    [0m | [1macc:	| avg: 0.9991   	|  std: 0.001455 	|  min: 0.9941   	|  25%: 0.998    	|  50%: 1.0      	|  75%: 1.0      	|  max: 1.0      [0m
[32m2022-07-06 12:37:44[0m | [1mINFO    [0m | [1mlr:	| avg: 5e-05    	|  std: nan      	|  min: 5e-05    	|  25%: 5e-05    	|  50%: 5e-05    	|  75%: 5e-05    	|  max: 5e-05    [0m
[32m2022-07-06 12:37:44[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:37:44[0m | [1mINFO    [0m | [1mloss:	| avg: 540.1    	|  std: 9.262    	|  min: 525.5    	|  25%: 533.0    	|  50%: 538.2    	|  75%: 548.4    	|  max: 556.5    [0m
[32m2022-07-06 12:37:44[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]

train:   0%|          | 0/73 [00:00<?, ?it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.19it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.19it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.19it/s]
validation:   0%|          | 0/22 [00:00<?, ?it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 37.34it/s]


[32m2022-07-06 12:37:59[0m | [1mINFO    [0m | [1mFinished epoch 37/40:[0m
[32m2022-07-06 12:37:59[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:37:59[0m | [1mINFO    [0m | [1mloss:	| avg: 455.3    	|  std: 3.083    	|  min: 451.5    	|  25%: 453.2    	|  50%: 454.2    	|  75%: 455.8    	|  max: 467.8    [0m
[32m2022-07-06 12:37:59[0m | [1mINFO    [0m | [1macc:	| avg: 0.9991   	|  std: 0.001725 	|  min: 0.9902   	|  25%: 0.998    	|  50%: 1.0      	|  75%: 1.0      	|  max: 1.0      [0m
[32m2022-07-06 12:37:59[0m | [1mINFO    [0m | [1mlr:	| avg: 5e-05    	|  std: nan      	|  min: 5e-05    	|  25%: 5e-05    	|  50%: 5e-05    	|  75%: 5e-05    	|  max: 5e-05    [0m
[32m2022-07-06 12:37:59[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:37:59[0m | [1mINFO    [0m | [1mloss:	| avg: 540.1    	|  std: 11.23    	|  min: 522.5    	|  25%: 529.6    	|  50%: 543.8    	|  75%: 546.6    	|  max: 558.0    [0m
[32m2022-07-06 12:37:59[0m | 


train:   0%|          | 0/73 [00:00<?, ?it/s]

train:   0%|          | 0/73 [00:00<?, ?it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.17it/s]
validation:   0%|          | 0/22 [00:00<?, ?it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.17it/s]
validation:   0%|          | 0/22 [00:00<?, ?it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 36.75it/s]


[32m2022-07-06 12:38:15[0m | [1mINFO    [0m | [1mFinished epoch 38/40:[0m
[32m2022-07-06 12:38:15[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:38:15[0m | [1mINFO    [0m | [1mloss:	| avg: 455.1    	|  std: 2.917    	|  min: 451.0    	|  25%: 453.0    	|  50%: 454.0    	|  75%: 456.5    	|  max: 463.0    [0m
[32m2022-07-06 12:38:15[0m | [1mINFO    [0m | [1macc:	| avg: 0.999    	|  std: 0.001597 	|  min: 0.9941   	|  25%: 0.998    	|  50%: 1.0      	|  75%: 1.0      	|  max: 1.0      [0m
[32m2022-07-06 12:38:15[0m | [1mINFO    [0m | [1mlr:	| avg: 5e-05    	|  std: nan      	|  min: 5e-05    	|  25%: 5e-05    	|  50%: 5e-05    	|  75%: 5e-05    	|  max: 5e-05    [0m
[32m2022-07-06 12:38:15[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:38:15[0m | [1mINFO    [0m | [1mloss:	| avg: 537.1    	|  std: 9.271    	|  min: 519.5    	|  25%: 534.0    	|  50%: 537.8    	|  75%: 541.9    	|  max: 556.0    [0m
[32m2022-07-06 12:38:15[0m | 



train:   0%|          | 0/73 [00:00<?, ?it/s]
train:   0%|          | 0/73 [00:00<?, ?it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.16it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.15it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.15it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.15it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 37.53it/s]


[32m2022-07-06 12:38:30[0m | [1mINFO    [0m | [1mFinished epoch 39/40:[0m
[32m2022-07-06 12:38:30[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:38:30[0m | [1mINFO    [0m | [1mloss:	| avg: 454.2    	|  std: 2.319    	|  min: 451.0    	|  25%: 452.5    	|  50%: 453.5    	|  75%: 455.5    	|  max: 463.5    [0m
[32m2022-07-06 12:38:30[0m | [1mINFO    [0m | [1macc:	| avg: 0.9996   	|  std: 0.0009898	|  min: 0.9961   	|  25%: 1.0      	|  50%: 1.0      	|  75%: 1.0      	|  max: 1.0      [0m
[32m2022-07-06 12:38:30[0m | [1mINFO    [0m | [1mlr:	| avg: 5e-05    	|  std: nan      	|  min: 5e-05    	|  25%: 5e-05    	|  50%: 5e-05    	|  75%: 5e-05    	|  max: 5e-05    [0m
[32m2022-07-06 12:38:30[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:38:30[0m | [1mINFO    [0m | [1mloss:	| avg: 539.2    	|  std: 10.83    	|  min: 515.0    	|  25%: 535.2    	|  50%: 539.5    	|  75%: 545.9    	|  max: 561.5    [0m
[32m2022-07-06 12:38:30[0m | 



train:   0%|          | 0/73 [00:00<?, ?it/s]
train:   0%|          | 0/73 [00:00<?, ?it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.15it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.15it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.15it/s]
train: 100%|██████████| 73/73 [00:14<00:00,  5.15it/s]
validation: 100%|██████████| 22/22 [00:00<00:00, 37.40it/s]


[32m2022-07-06 12:38:46[0m | [1mINFO    [0m | [1mFinished epoch 40/40:[0m
[32m2022-07-06 12:38:46[0m | [1mINFO    [0m | [1mtrain:[0m
[32m2022-07-06 12:38:46[0m | [1mINFO    [0m | [1mloss:	| avg: 454.4    	|  std: 2.115    	|  min: 451.8    	|  25%: 452.8    	|  50%: 454.0    	|  75%: 455.8    	|  max: 460.0    [0m
[32m2022-07-06 12:38:46[0m | [1mINFO    [0m | [1macc:	| avg: 0.9992   	|  std: 0.001254 	|  min: 0.9941   	|  25%: 0.998    	|  50%: 1.0      	|  75%: 1.0      	|  max: 1.0      [0m
[32m2022-07-06 12:38:46[0m | [1mINFO    [0m | [1mlr:	| avg: 5e-05    	|  std: nan      	|  min: 5e-05    	|  25%: 5e-05    	|  50%: 5e-05    	|  75%: 5e-05    	|  max: 5e-05    [0m
[32m2022-07-06 12:38:46[0m | [1mINFO    [0m | [1mvalidation:[0m
[32m2022-07-06 12:38:46[0m | [1mINFO    [0m | [1mloss:	| avg: 539.4    	|  std: 9.066    	|  min: 523.5    	|  25%: 531.6    	|  50%: 541.2    	|  75%: 548.0    	|  max: 551.0    [0m
[32m2022-07-06 12:38:46[0m | 

In [5]:
# Evaluate the trained algorithm on the 'test' subset and average the recorded
# 'acc' scalar values (presumably one accuracy value per test batch — confirm).
# NOTE(review): in the saved run this is ~0.775 while the training accuracy of
# the last epoch is ~0.999 — a large gap that is worth investigating.
test_results = alg.evaluate('test')
np.mean(test_results['scalar']['acc'])

test:   0%|          | 0/20 [00:00<?, ?it/s]

0.7747989445924759

## Show TensorBoard

In [10]:
# Load the TensorBoard notebook extension, which registers the %tensorboard magic.
%load_ext tensorboard

In [11]:
# Start TensorBoard on the log directory of one specific experiment run, serving on port 13067.
# NOTE(review): the log directory is a hard-coded absolute path that repeats root_dir and pins a
# single run (0147_20220706_122801); it must be edited by hand to inspect any other run.
# NOTE(review): --bind_all makes TensorBoard listen on all network interfaces — confirm this is intended.
%tensorboard --logdir /localdata/elads/data/cifar10/cifar10/CIFAR10Algorithm/debug/0147_20220706_122801 --port=13067 --bind_all

## Hyperparameter search with native Optuna

In [None]:
# Baseline arguments for the native-Optuna hyperparameter search.
# The three positional strings carry command-line style flags; every setting
# after them is passed as a keyword argument.
# NOTE(review): this cell uses --half, whereas the other beam_arguments cells in
# this notebook use --amp — confirm the difference is intentional.
args = beam_arguments(
    f"--project-name=cifar10 --root-dir={root_dir} --algorithm=CIFAR10Algorithm --device=0 --half --lr-d=1e-3 --batch-size=512",
    "--n-epochs=40 --clip-gradient=1000 --parallel=4 --accumulate=1 --no-deterministic",
    "--weight-decay=1e-5 --beta1=0.9 --beta2=0.9",
    path_to_data=path_to_data,
    dropout=0.0,
    activation='relu',
    channels=512,
    label_smoothing=0.2,
    padding=6,
    gain=0.2,
    turn_point=1024,
    final_point=3000,
    minimal_gain=0.05,
    temperature=1,
)

# NOTE(review): cifar10_algorithm_generator is not among the names imported in
# the first cell; presumably it is defined in an earlier cell — confirm it is
# available on a fresh kernel.
study = Study(cifar10_algorithm_generator, args)

In [14]:
def suggest(trial):
    """Sample the hyperparameters for a single Optuna trial.

    Args:
        trial: Optuna trial object used to draw the sample.

    Returns:
        dict: ``{'lr_dense': lr}``, where ``lr`` is drawn on a log scale
        from the range [1e-3, 2e-2].
    """
    # `suggest_float(..., log=True)` replaces the deprecated `suggest_loguniform`.
    # The value is requested from the trial under the name "lr" but returned
    # under the key 'lr_dense'.
    lr = trial.suggest_float("lr", 1e-3, 2e-2, log=True)
    print('My suggestion')
    print(lr)
    return {'lr_dense': lr}
    

In [15]:
# Start the native Optuna search, using `suggest` to propose hyperparameters:
# 10 trials, one job, with the objective being maximised.
study.optuna(
    suggest,
    n_trials=10,
    n_jobs=1,
    direction='maximize',
)

[32m[I 2022-06-20 08:46:21,221][0m A new study created in memory with name: cifar10/CIFAR10Algorithm/debug_hp_optimization_20220620_084618[0m


My suggestion
0.009781018192999246
[32m2022-06-20 08:46:21.224[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mrunner_optuna[0m:[36m114[0m - [1mNext Hyperparameter suggestion:[0m
[32m2022-06-20 08:46:21.225[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mrunner_optuna[0m:[36m116[0m - [1mlr_dense: 0.009781018192999246[0m
[32m2022-06-20 08:46:21.229[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m262[0m - [1mCreating new experiment[0m
[32m2022-06-20 08:46:21.229[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m277[0m - [1mExperiment directory is: /home/shared/data/results/cifar10/cifar10/CIFAR10Algorithm/debug_hp_optimization_20220620_084618/0000_20220620_084621[0m
[32m2022-06-20 08:46:21.239[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mrun[0m:[36m554[0m - [1mSingle worker mode[0m
[32m2022-06-20 08:46:21.240[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mrun

KeyboardInterrupt: 

## Hyperparameter search with ray-tune and optuna

In [3]:
# Base configuration for the Ray Tune search.
# Command-line style flags, passed to `beam_arguments` as positional strings.
cli_flags = (
    f"--project-name=cifar10 --root-dir={root_dir} --algorithm=CIFAR10Algorithm --device=0 --amp --lr-d=1e-3 --batch-size=512",
    "--n-epochs=40 --clip-gradient=1000 --parallel=0 --accumulate=1 --no-deterministic",
    "--weight-decay=1e-5 --beta1=0.9 --beta2=0.9",
)

# Additional hyperparameters, passed to `beam_arguments` as keyword arguments.
hparam_overrides = dict(
    path_to_data=path_to_data,
    dropout=.0,
    activation='relu',
    channels=512,
    label_smoothing=.2,
    padding=6,
    gain=.2,
    turn_point=1024,
    final_point=3000,
    minimal_gain=.05,
    temperature=1,
)

args = beam_arguments(*cli_flags, **hparam_overrides)

# The study receives the base arguments plus the algorithm and dataset classes.
study = Study(
    args,
    Alg=CIFAR10Algorithm,
    Dataset=CIFAR10Dataset,
    print_results=True,
)

[32m2022-07-06 16:20:20[0m | [1mINFO    [0m | [1mHyperparameter Optimization[0m
[32m2022-07-06 16:20:20[0m | [1mINFO    [0m | [1mbeam project: cifar10[0m
[32m2022-07-06 16:20:20[0m | [1mINFO    [0m | [1mExperiment Hyperparameters[0m
[32m2022-07-06 16:20:20[0m | [1mINFO    [0m | [1mproject_name: cifar10[0m
[32m2022-07-06 16:20:20[0m | [1mINFO    [0m | [1malgorithm: CIFAR10Algorithm[0m
[32m2022-07-06 16:20:20[0m | [1mINFO    [0m | [1midentifier: debug_hp_optimization_20220706_162020[0m
[32m2022-07-06 16:20:20[0m | [1mINFO    [0m | [1mmp_port: random[0m
[32m2022-07-06 16:20:20[0m | [1mINFO    [0m | [1mroot_dir: /localdata/elads/data/cifar10[0m
[32m2022-07-06 16:20:20[0m | [1mINFO    [0m | [1mreload: False[0m
[32m2022-07-06 16:20:20[0m | [1mINFO    [0m | [1mresume: -1[0m
[32m2022-07-06 16:20:20[0m | [1mINFO    [0m | [1moverride: False[0m
[32m2022-07-06 16:20:20[0m | [1mINFO    [0m | [1mcpu_workers: 0[0m
[32m2022-07-06

In [None]:
# hebo = HEBOSearch(metric="mean_accuracy", mode="max")

# analysis = study.tune(config={"lr_dense": tune.loguniform(1e-3, 2e-2),
#                               "weight_decay": tune.loguniform(1e-6, 1e-4),
#                               "gamma": tune.loguniform(.1, .9),
#                               "dropout": tune.uniform(0, .75),
#                               "scale_down": tune.uniform(0.4, .7),
#                               "scale_up": tune.uniform(0.9, 1.2),
#                               "ratio_down": tune.uniform(0.7, .95),
#                               "ratio_up": tune.uniform(1.05, 1.4),
#                               "channels": tune.choice([128, 256, 512]),
#                               "batch_size": tune.choice([512, 1024, 2048]),},
#                        metric="mean_accuracy",
#                        max_concurrent_trials=4,
#                        resources_per_trial={"gpu": 1},
#                        mode="max",
#                        search_alg=hebo,
#                       progress_reporter=JupyterNotebookReporter(overwrite=True),
#                        num_samples=400)


# Ray Tune hyperparameter search using the Optuna search algorithm.
# Requests 400 samples, at most 8 concurrent trials, one GPU per trial, and
# maximises the "mean_accuracy" metric.
analysis = study.tune(config={"lr_dense": tune.loguniform(1e-4, 2e-2),
                              "weight_decay": tune.loguniform(1e-6, 1e-2),
                              "beta1": tune.loguniform(.85, .95),
                              # degenerate range (low == high): gain is effectively pinned to 0.2
                              "gain": tune.uniform(0.2, .2),
                              "temperature": tune.uniform(0.05, 2.),
                              "minimal_gain": tune.loguniform(.01, .1),
                              "channels": tune.choice([256, 512, 1024]),
                              "padding": tune.choice([4, 6, 8]),
                              "turn_point": tune.choice([256, 512, 1024]),
                              # 2048, 2048*1.5 and 2048*2 written as ints: `2048*1.5` evaluates to the
                              # float 3072.0, whereas the base configuration passes final_point as an int
                              "final_point": tune.choice([2048, 3072, 4096]),
                              "batch_size": tune.choice([256, 512, 1024]),
                              "activation": tune.choice(['relu', 'celu', 'gelu'])},
                      metric="mean_accuracy",
                      max_concurrent_trials=8,
                      resources_per_trial={"gpu": 1},
                      mode="max",
                      search_alg=OptunaSearch(),
                      progress_reporter=JupyterNotebookReporter(overwrite=True),
                      num_samples=400)


Trial name,status,loc,activation,batch_size,beta1,channels,final_point,gain,lr_dense,minimal_gain,padding,temperature,turn_point,weight_decay,acc,iter,total time (s)
runner_tune_ec1791a4,RUNNING,172.17.0.2:39938,relu,512,0.928183,1024,4096,0.2,0.00671536,0.0357185,4,0.062858,512,4.63743e-05,0.934482,35.0,454.552
runner_tune_3d2a6602,RUNNING,172.17.0.2:40084,relu,512,0.911644,1024,4096,0.2,0.0071578,0.0349454,4,0.0630833,512,3.41031e-05,0.930131,25.0,308.486
runner_tune_93f28ee2,RUNNING,172.17.0.2:40184,relu,512,0.911794,1024,4096,0.2,0.011317,0.0469718,4,0.0575666,512,2.46689e-05,0.925337,17.0,217.496
runner_tune_c8115550,RUNNING,172.17.0.2:40344,relu,256,0.927557,1024,4096,0.2,0.0106841,0.0470998,4,0.0569684,512,3.21594e-05,0.763281,2.0,34.0246
runner_tune_38247390,PENDING,,relu,512,0.927516,1024,4096,0.2,0.00689768,0.0473985,4,0.0550966,512,2.76028e-05,,,
runner_tune_c944283c,TERMINATED,172.17.0.2:23692,celu,256,0.904816,256,2048,0.2,0.0099276,0.0735093,8,1.58846,512,3.5821e-06,0.880295,40.0,204.667
runner_tune_cc0e4228,TERMINATED,172.17.0.2:23729,relu,512,0.883576,512,2048,0.2,0.000335789,0.01734,4,0.221518,256,6.57065e-05,0.908114,40.0,233.51
runner_tune_cc12cf64,TERMINATED,172.17.0.2:23731,gelu,1024,0.933654,512,4096,0.2,0.00266318,0.014136,6,1.3378,512,0.00157602,0.910742,40.0,230.826
runner_tune_cc172366,TERMINATED,172.17.0.2:23733,gelu,512,0.943031,1024,2048,0.2,0.000101818,0.0812117,6,1.14841,1024,2.45449e-06,0.872603,40.0,497.553
runner_tune_cc1b3c94,TERMINATED,172.17.0.2:24077,relu,256,0.856223,256,4096,0.2,0.00219286,0.0769723,4,0.668636,512,0.00776539,0.907031,40.0,188.601


In [None]:
# NOTE(review): scratch expression that does not affect the analysis — consider deleting this cell.
1 + 1