In [1]:
%load_ext autoreload
%autoreload 2

import torch
import torchvision
import torch.nn.functional as F
from torch import nn
from sklearn.metrics import precision_recall_fscore_support
import numpy as np
import math

# Start the local Ray runtime before importing ray.tune below.
# `working_dir=".."` makes Ray package the parent directory and push it to the
# cluster (see the "Creating a file package for local directory '..'" log line),
# so that project-relative imports resolve inside Ray workers.
import ray
runtime_env = {"working_dir": ".."}
# ignore_reinit_error=True keeps this cell re-runnable: without it, executing
# the cell a second time in the same kernel raises because Ray is already
# initialised.
ray.init(
    runtime_env=runtime_env,
    dashboard_port=13065,
    include_dashboard=True,
    ignore_reinit_error=True,
)

from ray import tune
from ray.tune.suggest.optuna import OptunaSearch
from ray.tune import JupyterNotebookReporter

# Manage beam's relative imports: make the parent directory importable so that
# the `src.beam` package used by the imports below can be found.
import sys
# Guarded so that re-running this cell does not keep appending duplicate
# '..' entries to sys.path.
if '..' not in sys.path:
    sys.path.append('..')

from src.beam import beam_arguments, Experiment, Study
from src.beam import UniversalDataset, UniversalBatchSampler, PackedFolds
from src.beam import Algorithm
from src.beam import LinearNet, check_type, slice_to_index
from torchvision import transforms
import matplotlib.pyplot as plt

from src.beam import DataTensor
from src.beam.utils import is_notebook

from sklearn.datasets import fetch_covtype
import pandas as pd

from covtype_example import CovtypeDataset, CovtypeAlgorithm, RuleNet, covtype_algorithm_generator, get_covtype_parser 

2022-06-26 12:28:11,979	INFO services.py:1456 -- View the Ray dashboard at [1m[32mhttp://127.0.0.1:13065[39m[22m
2022-06-26 12:28:12,512	INFO packaging.py:388 -- Creating a file package for local directory '..'.
2022-06-26 12:28:12,536	INFO packaging.py:241 -- Pushing file package 'gcs://_ray_pkg_16b7a439f752140a.zip' (1.03MiB) to Ray cluster...
2022-06-26 12:28:12,551	INFO packaging.py:243 -- Successfully pushed file package 'gcs://_ray_pkg_16b7a439f752140a.zip'.


In [2]:
import os

# Locations used by the experiment cells below:
#   path_to_data - passed to beam_arguments as the `path_to_data` keyword
#   root_dir     - interpolated into the `--root-dir=` flag
# The defaults are the original shared-server paths. Set COVTYPE_DATA_PATH /
# COVTYPE_ROOT_DIR in the environment to run the notebook on another machine
# without editing this cell.
path_to_data = os.environ.get('COVTYPE_DATA_PATH', '/home/shared/data/dataset/covtype')
root_dir = os.environ.get('COVTYPE_ROOT_DIR', '/home/shared/data/results/covtype')

In [13]:
# Build the hyperparameter namespace for the covtype run and wrap it in an
# Experiment. String arguments carry command-line style flags; keyword
# arguments set individual values by name.
#
# NOTE(review): weight decay is given twice here -- `--weight-decay=1e-5` in the
# flag string and `weight_decay=1e-3` as a keyword. Which one takes effect
# depends on beam_arguments (not visible from this notebook) -- confirm, then
# drop the redundant one.
args = beam_arguments(
    get_covtype_parser(),
    # --- command-line style flags ---
    f"--project-name=covtype --root-dir={root_dir} --algorithm=CovtypeAlgorithm --device=0 --no-half --lr-d=1e-3 --lr-s=.02 --batch-size=512",
    "--n-epochs=100 --clip=0 --parallel=1 --accumulate=1 --cudnn-benchmark",
    "--weight-decay=1e-5 --beta1=0.9 --beta2=0.99",
    # --- keyword values: optimisation / regularisation ---
    weight_factor=1.0,
    scheduler_patience=16,
    weight_decay=1e-3,
    label_smoothing=0.2,
    # --- keyword values: k_p / k_i / k_d gains and initial mask ---
    # presumably controller-style gains; verify against CovtypeAlgorithm
    k_p=0.05,
    k_i=0.001,
    k_d=0.005,
    initial_mask=1,
    # --- keyword values: data location and network shape ---
    path_to_data=path_to_data,
    dropout=0.0,
    activation='gelu',
    channels=256,
    n_rules=128,
    n_layers=4,
    scheduler_factor=1 / math.sqrt(10),
)

experiment = Experiment(args)

[32m2022-06-26 12:44:48.913[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m183[0m - [1mbeam project: covtype[0m
[32m2022-06-26 12:44:48.915[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m184[0m - [1mExperiment Hyperparameters[0m
[32m2022-06-26 12:44:48.916[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m189[0m - [1mproject_name: covtype[0m
[32m2022-06-26 12:44:48.917[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m189[0m - [1midentifier: debug[0m
[32m2022-06-26 12:44:48.918[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m189[0m - [1malgorithm: CovtypeAlgorithm[0m
[32m2022-06-26 12:44:48.919[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m189[0m - [1mmp_port: None[0m
[32m2022-06-26 12:44:48.920[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m189[0m - [1mroot_

In [37]:
# Build the hyperparameter namespace for the covtype run and wrap it in an
# Experiment. String arguments carry command-line style flags; keyword
# arguments set individual values by name. Executing this cell rebinds `args`
# and `experiment`.
args = beam_arguments(
    get_covtype_parser(),
    # --- command-line style flags ---
    f"--project-name=covtype --root-dir={root_dir} --algorithm=CovtypeAlgorithm --device=0 --clip=0. --amp --lr-d=1e-3 --lr-s=.02 --batch-size=1024",
    "--n-epochs=100 --parallel=1 --accumulate=1 --cudnn-benchmark",
    "--weight-decay=1e-5 --beta1=0.9 --beta2=0.999",
    # --- keyword values: optimisation / regularisation ---
    weight_factor=0.0,
    scheduler_patience=16,
    label_smoothing=0.1,
    # --- keyword values: k_p / k_i / k_d gains and initial mask ---
    # presumably controller-style gains; verify against CovtypeAlgorithm
    k_p=0.05,
    k_i=0.001,
    k_d=0.005,
    initial_mask=1,
    # --- keyword values: data location and network shape ---
    path_to_data=path_to_data,
    dropout=0.0,
    activation='gelu',
    channels=192,
    n_rules=128,
    n_layers=3,
    scheduler_factor=1 / math.sqrt(10),
)

experiment = Experiment(args)

[32m2022-06-26 15:27:13.751[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m183[0m - [1mbeam project: covtype[0m
[32m2022-06-26 15:27:13.752[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m184[0m - [1mExperiment Hyperparameters[0m
[32m2022-06-26 15:27:13.753[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m189[0m - [1mproject_name: covtype[0m
[32m2022-06-26 15:27:13.754[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m189[0m - [1midentifier: debug[0m
[32m2022-06-26 15:27:13.754[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m189[0m - [1malgorithm: CovtypeAlgorithm[0m
[32m2022-06-26 15:27:13.755[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m189[0m - [1mmp_port: None[0m
[32m2022-06-26 15:27:13.756[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m189[0m - [1mroot_

In [38]:
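# Direct call to the generator, kept for reference only (disabled); the next
# cell passes the generator to `experiment` instead.
# alg = covtype_algorithm_generator(experiment)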

In [39]:
# Run the experiment by calling it with the covtype algorithm generator; the
# returned object is bound to `alg`.
# In the recorded run below this executes in single-worker mode for 100 epochs,
# with roughly 1m45s between consecutive "Finished epoch" log entries, so this
# is a long-running cell.
alg = experiment(covtype_algorithm_generator)

[32m2022-06-26 15:27:16.726[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mrun[0m:[36m553[0m - [1mSingle worker mode[0m
[32m2022-06-26 15:27:16.728[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mrun_worker[0m:[36m45[0m - [1mWorker: 1/1 is running...[0m


train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 15:29:03.183[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 1[0m
[32m2022-06-26 15:29:03.184[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0[0m

[32m2022-06-26 15:29:03.185[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 1/100:[0m
[32m2022-06-26 15:29:03.189[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 15:29:03.190[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 1046.82 	|[0m
[32m2022-06-26 15:29:03.191[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.705839 	|[0m
[32m2022-06-26 15:29:03.191[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mlr 0.001 	|[0m
[32m2022-06-26 15

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 15:30:49.439[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 1[0m
[32m2022-06-26 15:30:49.441[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0[0m

[32m2022-06-26 15:30:49.442[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 2/100:[0m
[32m2022-06-26 15:30:49.447[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 15:30:49.448[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 856.087 	|[0m
[32m2022-06-26 15:30:49.449[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.804399 	|[0m
[32m2022-06-26 15:30:49.450[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mlr 0.001 	|[0m
[32m2022-06-26 15

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 15:32:35.352[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 1[0m
[32m2022-06-26 15:32:35.353[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0[0m

[32m2022-06-26 15:32:35.354[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 3/100:[0m
[32m2022-06-26 15:32:35.359[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 15:32:35.359[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 780.585 	|[0m
[32m2022-06-26 15:32:35.360[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.844577 	|[0m
[32m2022-06-26 15:32:35.361[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mlr 0.001 	|[0m
[32m2022-06-26 15

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 15:34:20.988[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 1[0m
[32m2022-06-26 15:34:20.989[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0[0m

[32m2022-06-26 15:34:20.989[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 4/100:[0m
[32m2022-06-26 15:34:20.993[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 15:34:20.994[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 734.399 	|[0m
[32m2022-06-26 15:34:20.994[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.869325 	|[0m
[32m2022-06-26 15:34:20.995[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mlr 0.001 	|[0m
[32m2022-06-26 15

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 15:36:06.827[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 1[0m
[32m2022-06-26 15:36:06.828[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0[0m

[32m2022-06-26 15:36:06.829[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 5/100:[0m
[32m2022-06-26 15:36:06.834[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 15:36:06.835[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 698.818 	|[0m
[32m2022-06-26 15:36:06.836[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.888485 	|[0m
[32m2022-06-26 15:36:06.837[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mlr 0.001 	|[0m
[32m2022-06-26 15

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 15:37:52.266[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 1[0m
[32m2022-06-26 15:37:52.267[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0[0m

[32m2022-06-26 15:37:52.268[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 6/100:[0m
[32m2022-06-26 15:37:52.272[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 15:37:52.272[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 675.008 	|[0m
[32m2022-06-26 15:37:52.273[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.9008 	|[0m
[32m2022-06-26 15:37:52.274[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mlr 0.001 	|[0m
[32m2022-06-26 15:3

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 15:39:37.951[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9993158384168893[0m
[32m2022-06-26 15:39:37.952[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.0009208957642236223[0m

[32m2022-06-26 15:39:37.953[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 7/100:[0m
[32m2022-06-26 15:39:37.958[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 15:39:37.959[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 655.634 	|[0m
[32m2022-06-26 15:39:37.959[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.911012 	|[0m
[32m2022-06-26 15:39:37.960[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - 

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 15:41:23.657[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 1[0m
[32m2022-06-26 15:41:23.658[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.0003580747121886221[0m

[32m2022-06-26 15:41:23.659[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 8/100:[0m
[32m2022-06-26 15:41:23.663[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 15:41:23.664[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 643.633 	|[0m
[32m2022-06-26 15:41:23.664[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.917139 	|[0m
[32m2022-06-26 15:41:23.665[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mlr 0.001 	|[0

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 15:43:09.508[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 1[0m
[32m2022-06-26 15:43:09.508[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.0001582958361448578[0m

[32m2022-06-26 15:43:09.509[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 9/100:[0m
[32m2022-06-26 15:43:09.513[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 15:43:09.514[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 629.267 	|[0m
[32m2022-06-26 15:43:09.515[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.923972 	|[0m
[32m2022-06-26 15:43:09.515[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mlr 0.001 	|[0

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 15:44:55.180[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 1[0m
[32m2022-06-26 15:44:55.181[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.00037429970546641264[0m

[32m2022-06-26 15:44:55.183[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 10/100:[0m
[32m2022-06-26 15:44:55.186[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 15:44:55.187[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 620.52 	|[0m
[32m2022-06-26 15:44:55.188[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.928017 	|[0m
[32m2022-06-26 15:44:55.189[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mlr 0.001 	|[

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 15:46:40.823[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9988166246708431[0m
[32m2022-06-26 15:46:40.824[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.0013661856212461077[0m

[32m2022-06-26 15:46:40.825[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 11/100:[0m
[32m2022-06-26 15:46:40.829[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 15:46:40.830[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 611.093 	|[0m
[32m2022-06-26 15:46:40.830[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.933274 	|[0m
[32m2022-06-26 15:46:40.831[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - 

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 15:48:26.989[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.999148901352857[0m
[32m2022-06-26 15:48:26.991[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.001544609286126702[0m

[32m2022-06-26 15:48:26.992[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 12/100:[0m
[32m2022-06-26 15:48:26.995[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 15:48:26.996[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 610.757 	|[0m
[32m2022-06-26 15:48:26.997[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.933576 	|[0m
[32m2022-06-26 15:48:26.998[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 15:50:12.831[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9989318272807621[0m
[32m2022-06-26 15:50:12.833[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.0022750406844096716[0m

[32m2022-06-26 15:50:12.834[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 13/100:[0m
[32m2022-06-26 15:50:12.838[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 15:50:12.839[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 602.861 	|[0m
[32m2022-06-26 15:50:12.840[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.936999 	|[0m
[32m2022-06-26 15:50:12.841[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - 

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 15:51:58.431[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9984101110952149[0m
[32m2022-06-26 15:51:58.432[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.0031849696074174004[0m

[32m2022-06-26 15:51:58.432[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 14/100:[0m
[32m2022-06-26 15:51:58.435[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 15:51:58.436[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 597.429 	|[0m
[32m2022-06-26 15:51:58.436[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.940317 	|[0m
[32m2022-06-26 15:51:58.437[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - 

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 15:53:44.209[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.997753781197991[0m
[32m2022-06-26 15:53:44.210[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.004131460338903272[0m

[32m2022-06-26 15:53:44.211[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 15/100:[0m
[32m2022-06-26 15:53:44.213[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 15:53:44.214[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 596.139 	|[0m
[32m2022-06-26 15:53:44.215[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.941095 	|[0m
[32m2022-06-26 15:53:44.215[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 15:55:29.825[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9973708768156768[0m
[32m2022-06-26 15:55:29.826[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.004991956475285178[0m

[32m2022-06-26 15:55:29.827[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 16/100:[0m
[32m2022-06-26 15:55:29.830[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 15:55:29.831[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 592.396 	|[0m
[32m2022-06-26 15:55:29.832[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.942766 	|[0m
[32m2022-06-26 15:55:29.832[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - 

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 15:57:15.221[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9966107888522122[0m
[32m2022-06-26 15:57:15.222[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.005949052479954744[0m

[32m2022-06-26 15:57:15.223[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 17/100:[0m
[32m2022-06-26 15:57:15.226[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 15:57:15.226[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 593.756 	|[0m
[32m2022-06-26 15:57:15.227[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.942391 	|[0m
[32m2022-06-26 15:57:15.228[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - 

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 15:59:00.948[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.995768584975128[0m
[32m2022-06-26 15:59:00.949[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.006918402779222217[0m

[32m2022-06-26 15:59:00.950[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 18/100:[0m
[32m2022-06-26 15:59:00.953[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 15:59:00.954[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 589.422 	|[0m
[32m2022-06-26 15:59:00.954[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.944434 	|[0m
[32m2022-06-26 15:59:00.955[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:00:46.294[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9953011549171283[0m
[32m2022-06-26 16:00:46.296[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.007798969263980253[0m

[32m2022-06-26 16:00:46.297[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 19/100:[0m
[32m2022-06-26 16:00:46.300[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:00:46.301[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 589.193 	|[0m
[32m2022-06-26 16:00:46.302[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.945085 	|[0m
[32m2022-06-26 16:00:46.303[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - 

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:02:32.067[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9939419041150841[0m
[32m2022-06-26 16:02:32.069[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.008793434755093596[0m

[32m2022-06-26 16:02:32.070[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 20/100:[0m
[32m2022-06-26 16:02:32.074[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:02:32.075[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 588.671 	|[0m
[32m2022-06-26 16:02:32.076[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.944921 	|[0m
[32m2022-06-26 16:02:32.076[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - 

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:04:17.653[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9923943723052331[0m
[32m2022-06-26 16:04:17.654[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.00978986829231582[0m

[32m2022-06-26 16:04:17.655[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 21/100:[0m
[32m2022-06-26 16:04:17.660[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:04:17.661[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 589.886 	|[0m
[32m2022-06-26 16:04:17.661[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.944791 	|[0m
[32m2022-06-26 16:04:17.662[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:06:02.599[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.991292822370285[0m
[32m2022-06-26 16:06:02.600[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.010764106566215638[0m

[32m2022-06-26 16:06:02.601[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 22/100:[0m
[32m2022-06-26 16:06:02.604[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:06:02.605[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 591.598 	|[0m
[32m2022-06-26 16:06:02.606[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.943685 	|[0m
[32m2022-06-26 16:06:02.606[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:07:47.982[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.989795951995266[0m
[32m2022-06-26 16:07:47.983[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.011755139112914285[0m

[32m2022-06-26 16:07:47.984[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 23/100:[0m
[32m2022-06-26 16:07:47.987[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:07:47.988[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 591.317 	|[0m
[32m2022-06-26 16:07:47.989[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.943578 	|[0m
[32m2022-06-26 16:07:47.990[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:09:33.622[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.98823063747168[0m
[32m2022-06-26 16:09:33.624[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.012747225908446238[0m

[32m2022-06-26 16:09:33.625[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 24/100:[0m
[32m2022-06-26 16:09:33.628[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:09:33.629[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 592.502 	|[0m
[32m2022-06-26 16:09:33.630[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.942936 	|[0m
[32m2022-06-26 16:09:33.630[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:11:19.123[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9867196177574868[0m
[32m2022-06-26 16:11:19.124[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.013735528577318235[0m

[32m2022-06-26 16:11:19.125[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 25/100:[0m
[32m2022-06-26 16:11:19.129[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:11:19.130[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 592.899 	|[0m
[32m2022-06-26 16:11:19.130[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.94287 	|[0m
[32m2022-06-26 16:11:19.131[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:13:04.723[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9851582530442871[0m
[32m2022-06-26 16:13:04.725[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.01472359380276335[0m

[32m2022-06-26 16:13:04.727[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 26/100:[0m
[32m2022-06-26 16:13:04.731[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:13:04.731[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 595.634 	|[0m
[32m2022-06-26 16:13:04.732[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.941369 	|[0m
[32m2022-06-26 16:13:04.733[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:14:50.206[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9835333492412454[0m
[32m2022-06-26 16:14:50.208[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.01571396999459151[0m

[32m2022-06-26 16:14:50.209[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 27/100:[0m
[32m2022-06-26 16:14:50.213[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:14:50.214[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 597.103 	|[0m
[32m2022-06-26 16:14:50.215[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.94068 	|[0m
[32m2022-06-26 16:14:50.217[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:16:35.896[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9824129026488087[0m
[32m2022-06-26 16:16:35.897[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.01664160651242237[0m

[32m2022-06-26 16:16:35.898[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 28/100:[0m
[32m2022-06-26 16:16:35.902[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:16:35.903[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 597.433 	|[0m
[32m2022-06-26 16:16:35.904[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.94049 	|[0m
[32m2022-06-26 16:16:35.905[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:18:21.254[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9810083975981905[0m
[32m2022-06-26 16:18:21.256[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.017609557337819954[0m

[32m2022-06-26 16:18:21.258[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 29/100:[0m
[32m2022-06-26 16:18:21.261[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:18:21.263[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 596.616 	|[0m
[32m2022-06-26 16:18:21.263[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.940813 	|[0m
[32m2022-06-26 16:18:21.264[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - 

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:20:06.959[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9795274787144058[0m
[32m2022-06-26 16:20:06.961[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.018585870078213433[0m

[32m2022-06-26 16:20:06.962[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 30/100:[0m
[32m2022-06-26 16:20:06.965[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:20:06.966[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 598.248 	|[0m
[32m2022-06-26 16:20:06.967[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.940116 	|[0m
[32m2022-06-26 16:20:06.968[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - 

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:21:52.975[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9782341041970976[0m
[32m2022-06-26 16:21:52.977[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.019539686917901776[0m

[32m2022-06-26 16:21:52.979[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 31/100:[0m
[32m2022-06-26 16:21:52.983[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:21:52.985[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 598.534 	|[0m
[32m2022-06-26 16:21:52.985[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.940041 	|[0m
[32m2022-06-26 16:21:52.986[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - 

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:23:38.370[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9765778962773027[0m
[32m2022-06-26 16:23:38.371[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.02052687503504339[0m

[32m2022-06-26 16:23:38.372[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 32/100:[0m
[32m2022-06-26 16:23:38.376[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:23:38.377[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 597.124 	|[0m
[32m2022-06-26 16:23:38.378[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.940055 	|[0m
[32m2022-06-26 16:23:38.378[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:25:24.295[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9745656546852608[0m
[32m2022-06-26 16:25:24.297[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.021524085579706594[0m

[32m2022-06-26 16:25:24.298[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 33/100:[0m
[32m2022-06-26 16:25:24.301[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:25:24.302[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 599.893 	|[0m
[32m2022-06-26 16:25:24.303[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.938857 	|[0m
[32m2022-06-26 16:25:24.304[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - 

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:27:10.243[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9728601879222871[0m
[32m2022-06-26 16:27:10.244[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.022514869091442336[0m

[32m2022-06-26 16:27:10.245[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 34/100:[0m
[32m2022-06-26 16:27:10.249[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:27:10.250[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 601.253 	|[0m
[32m2022-06-26 16:27:10.251[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.938347 	|[0m
[32m2022-06-26 16:27:10.251[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - 

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:28:56.049[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9710173500455681[0m
[32m2022-06-26 16:28:56.050[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.023508819123856457[0m

[32m2022-06-26 16:28:56.051[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 35/100:[0m
[32m2022-06-26 16:28:56.054[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:28:56.055[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 602.069 	|[0m
[32m2022-06-26 16:28:56.056[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.937232 	|[0m
[32m2022-06-26 16:28:56.056[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - 

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:30:41.842[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9695181393216998[0m
[32m2022-06-26 16:30:41.843[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.024484461719392225[0m
Epoch 00036: reducing learning rate of group 0 to 3.1623e-04.
Epoch 00036: reducing learning rate of group 0 to 6.3246e-03.

[32m2022-06-26 16:30:41.845[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 36/100:[0m
[32m2022-06-26 16:30:41.848[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:30:41.849[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 603.546 	|[0m
[32m2022-06-26 16:30:41.850[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.936964 

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:32:27.463[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9674718793562034[0m
[32m2022-06-26 16:32:27.465[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.025481456419235382[0m

[32m2022-06-26 16:32:27.466[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 37/100:[0m
[32m2022-06-26 16:32:27.469[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:32:27.470[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 580.668 	|[0m
[32m2022-06-26 16:32:27.471[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.948499 	|[0m
[32m2022-06-26 16:32:27.472[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - 

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:34:13.470[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9651401808988095[0m
[32m2022-06-26 16:34:13.472[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.02648072040969572[0m

[32m2022-06-26 16:34:13.473[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 38/100:[0m
[32m2022-06-26 16:34:13.476[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:34:13.477[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 577.867 	|[0m
[32m2022-06-26 16:34:13.478[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.949829 	|[0m
[32m2022-06-26 16:34:13.479[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:35:59.011[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9628510957979842[0m
[32m2022-06-26 16:35:59.013[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.02747985695211504[0m

[32m2022-06-26 16:35:59.015[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 39/100:[0m
[32m2022-06-26 16:35:59.018[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:35:59.019[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 578.58 	|[0m
[32m2022-06-26 16:35:59.020[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.949818 	|[0m
[32m2022-06-26 16:35:59.020[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:37:44.431[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9605099333302067[0m
[32m2022-06-26 16:37:44.433[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.028479142332859832[0m

[32m2022-06-26 16:37:44.434[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 40/100:[0m
[32m2022-06-26 16:37:44.438[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:37:44.439[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 580.516 	|[0m
[32m2022-06-26 16:37:44.439[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.948504 	|[0m
[32m2022-06-26 16:37:44.440[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - 

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:39:30.112[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9580025885823585[0m
[32m2022-06-26 16:39:30.113[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.0294788094925035[0m

[32m2022-06-26 16:39:30.114[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 41/100:[0m
[32m2022-06-26 16:39:30.120[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:39:30.121[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 583.009 	|[0m
[32m2022-06-26 16:39:30.122[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.947075 	|[0m
[32m2022-06-26 16:39:30.122[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:41:15.361[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9556714968266995[0m
[32m2022-06-26 16:41:15.363[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.03047804499505079[0m

[32m2022-06-26 16:41:15.364[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 42/100:[0m
[32m2022-06-26 16:41:15.367[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:41:15.368[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 584.967 	|[0m
[32m2022-06-26 16:41:15.369[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.946603 	|[0m
[32m2022-06-26 16:41:15.370[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:43:00.924[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9532441244692279[0m
[32m2022-06-26 16:43:00.926[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.031477493249977256[0m

[32m2022-06-26 16:43:00.927[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 43/100:[0m
[32m2022-06-26 16:43:00.930[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:43:00.931[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 585.731 	|[0m
[32m2022-06-26 16:43:00.932[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.946275 	|[0m
[32m2022-06-26 16:43:00.933[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - 

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:44:46.485[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9511237305969172[0m
[32m2022-06-26 16:44:46.486[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.032475253607184[0m

[32m2022-06-26 16:44:46.488[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 44/100:[0m
[32m2022-06-26 16:44:46.491[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:44:46.491[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 588.323 	|[0m
[32m2022-06-26 16:44:46.492[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.944543 	|[0m
[32m2022-06-26 16:44:46.493[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1m

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:46:32.344[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9488094015658993[0m
[32m2022-06-26 16:46:32.346[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.03347414931879042[0m

[32m2022-06-26 16:46:32.347[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 45/100:[0m
[32m2022-06-26 16:46:32.350[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:46:32.351[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 589.759 	|[0m
[32m2022-06-26 16:46:32.351[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.943743 	|[0m
[32m2022-06-26 16:46:32.352[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:48:17.999[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9464873525590057[0m
[32m2022-06-26 16:48:18.000[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.03447310483170669[0m

[32m2022-06-26 16:48:18.000[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 46/100:[0m
[32m2022-06-26 16:48:18.004[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:48:18.004[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 591.799 	|[0m
[32m2022-06-26 16:48:18.005[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.942697 	|[0m
[32m2022-06-26 16:48:18.005[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:50:03.675[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9440881199396576[0m
[32m2022-06-26 16:50:03.676[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.0354723462576699[0m

[32m2022-06-26 16:50:03.677[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 47/100:[0m
[32m2022-06-26 16:50:03.680[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:50:03.681[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 592.363 	|[0m
[32m2022-06-26 16:50:03.682[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.942198 	|[0m
[32m2022-06-26 16:50:03.683[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:51:49.256[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9416607627149562[0m
[32m2022-06-26 16:51:49.258[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.03647164421668559[0m

[32m2022-06-26 16:51:49.259[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 48/100:[0m
[32m2022-06-26 16:51:49.262[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:51:49.263[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 594.936 	|[0m
[32m2022-06-26 16:51:49.264[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.941081 	|[0m
[32m2022-06-26 16:51:49.265[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:53:35.125[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9392092198157548[0m
[32m2022-06-26 16:53:35.126[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.03747097757979828[0m

[32m2022-06-26 16:53:35.128[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 49/100:[0m
[32m2022-06-26 16:53:35.131[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:53:35.132[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 596.079 	|[0m
[32m2022-06-26 16:53:35.132[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.940735 	|[0m
[32m2022-06-26 16:53:35.133[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:55:20.862[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9368492986390753[0m
[32m2022-06-26 16:55:20.864[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.0384698948905458[0m

[32m2022-06-26 16:55:20.865[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 50/100:[0m
[32m2022-06-26 16:55:20.867[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:55:20.868[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 599.001 	|[0m
[32m2022-06-26 16:55:20.869[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.938747 	|[0m
[32m2022-06-26 16:55:20.870[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:57:06.531[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9346041812389457[0m
[32m2022-06-26 16:57:06.532[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.0394678606175736[0m

[32m2022-06-26 16:57:06.534[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 51/100:[0m
[32m2022-06-26 16:57:06.538[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:57:06.539[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 600.783 	|[0m
[32m2022-06-26 16:57:06.540[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.937935 	|[0m
[32m2022-06-26 16:57:06.541[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 16:58:52.316[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9321698705208905[0m
[32m2022-06-26 16:58:52.317[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.040466923926511786[0m

[32m2022-06-26 16:58:52.318[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 52/100:[0m
[32m2022-06-26 16:58:52.321[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 16:58:52.322[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 601.977 	|[0m
[32m2022-06-26 16:58:52.323[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.937025 	|[0m
[32m2022-06-26 16:58:52.323[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - 

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:00:38.271[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9297155216674553[0m
[32m2022-06-26 17:00:38.273[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.04146611266789985[0m
Epoch 00053: reducing learning rate of group 0 to 1.0000e-04.
Epoch 00053: reducing learning rate of group 0 to 2.0000e-03.

[32m2022-06-26 17:00:38.274[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 53/100:[0m
[32m2022-06-26 17:00:38.277[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:00:38.278[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 603.708 	|[0m
[32m2022-06-26 17:00:38.278[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.936322 	

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:02:24.200[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9272271121756481[0m
[32m2022-06-26 17:02:24.201[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.042465400514765814[0m

[32m2022-06-26 17:02:24.202[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 54/100:[0m
[32m2022-06-26 17:02:24.206[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:02:24.207[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 598.545 	|[0m
[32m2022-06-26 17:02:24.208[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.939681 	|[0m
[32m2022-06-26 17:02:24.209[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - 

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:04:10.157[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9246269446281188[0m
[32m2022-06-26 17:04:10.158[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.04346497368536425[0m

[32m2022-06-26 17:04:10.158[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 55/100:[0m
[32m2022-06-26 17:04:10.161[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:04:10.162[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 597.592 	|[0m
[32m2022-06-26 17:04:10.162[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.939891 	|[0m
[32m2022-06-26 17:04:10.163[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:05:56.069[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9221224207202248[0m
[32m2022-06-26 17:05:56.070[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.04446427795086274[0m

[32m2022-06-26 17:05:56.071[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 56/100:[0m
[32m2022-06-26 17:05:56.074[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:05:56.075[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 599.376 	|[0m
[32m2022-06-26 17:05:56.075[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.939122 	|[0m
[32m2022-06-26 17:05:56.076[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:07:41.783[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.919540573986219[0m
[32m2022-06-26 17:07:41.784[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.04546376391603175[0m

[32m2022-06-26 17:07:41.785[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 57/100:[0m
[32m2022-06-26 17:07:41.789[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:07:41.790[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 602.717 	|[0m
[32m2022-06-26 17:07:41.790[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.937353 	|[0m
[32m2022-06-26 17:07:41.791[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:09:28.045[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.916918166890068[0m
[32m2022-06-26 17:09:28.046[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.04646335107897395[0m

[32m2022-06-26 17:09:28.048[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 58/100:[0m
[32m2022-06-26 17:09:28.051[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:09:28.052[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 603.719 	|[0m
[32m2022-06-26 17:09:28.053[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.937192 	|[0m
[32m2022-06-26 17:09:28.054[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:11:13.815[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9144321478686157[0m
[32m2022-06-26 17:11:13.816[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.047462558183651214[0m

[32m2022-06-26 17:11:13.818[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 59/100:[0m
[32m2022-06-26 17:11:13.821[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:11:13.822[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 607.542 	|[0m
[32m2022-06-26 17:11:13.822[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.935132 	|[0m
[32m2022-06-26 17:11:13.823[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - 

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:12:59.362[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9119291363483242[0m
[32m2022-06-26 17:12:59.363[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.048461784367748485[0m

[32m2022-06-26 17:12:59.364[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 60/100:[0m
[32m2022-06-26 17:12:59.366[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:12:59.367[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 609.092 	|[0m
[32m2022-06-26 17:12:59.368[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.934115 	|[0m
[32m2022-06-26 17:12:59.369[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - 

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:14:44.976[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.909521201209223[0m
[32m2022-06-26 17:14:44.978[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.04946059473919165[0m

[32m2022-06-26 17:14:44.979[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 61/100:[0m
[32m2022-06-26 17:14:44.983[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:14:44.984[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 611.534 	|[0m
[32m2022-06-26 17:14:44.985[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.93281 	|[0m
[32m2022-06-26 17:14:44.986[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1m

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:16:30.566[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9070185213751153[0m
[32m2022-06-26 17:16:30.567[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.05045980934878566[0m

[32m2022-06-26 17:16:30.568[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 62/100:[0m
[32m2022-06-26 17:16:30.571[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:16:30.572[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 613.56 	|[0m
[32m2022-06-26 17:16:30.573[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.931952 	|[0m
[32m2022-06-26 17:16:30.575[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:18:16.383[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9046893847413208[0m
[32m2022-06-26 17:18:16.385[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.05145812163642704[0m

[32m2022-06-26 17:18:16.386[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 63/100:[0m
[32m2022-06-26 17:18:16.390[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:18:16.391[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 617.162 	|[0m
[32m2022-06-26 17:18:16.392[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.929881 	|[0m
[32m2022-06-26 17:18:16.393[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:20:01.936[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.9022202378241447[0m
[32m2022-06-26 17:20:01.938[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.05245717285075479[0m

[32m2022-06-26 17:20:01.939[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 64/100:[0m
[32m2022-06-26 17:20:01.942[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:20:01.943[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 618.836 	|[0m
[32m2022-06-26 17:20:01.944[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.928688 	|[0m
[32m2022-06-26 17:20:01.945[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:21:47.731[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8999201592125408[0m
[32m2022-06-26 17:21:47.732[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.053455199040098746[0m

[32m2022-06-26 17:21:47.733[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 65/100:[0m
[32m2022-06-26 17:21:47.736[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:21:47.736[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 620.572 	|[0m
[32m2022-06-26 17:21:47.737[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.927518 	|[0m
[32m2022-06-26 17:21:47.738[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - 

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:23:33.453[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8975464877461379[0m
[32m2022-06-26 17:23:33.454[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.054453710223044995[0m

[32m2022-06-26 17:23:33.455[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 66/100:[0m
[32m2022-06-26 17:23:33.458[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:23:33.459[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 623.648 	|[0m
[32m2022-06-26 17:23:33.460[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.926216 	|[0m
[32m2022-06-26 17:23:33.461[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - 

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:25:19.437[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8952103460625955[0m
[32m2022-06-26 17:25:19.439[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.05545200640593434[0m

[32m2022-06-26 17:25:19.440[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 67/100:[0m
[32m2022-06-26 17:25:19.444[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:25:19.445[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 624.942 	|[0m
[32m2022-06-26 17:25:19.446[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.925582 	|[0m
[32m2022-06-26 17:25:19.447[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:27:05.263[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8930543617470578[0m
[32m2022-06-26 17:27:05.264[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.05644820896508372[0m

[32m2022-06-26 17:27:05.265[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 68/100:[0m
[32m2022-06-26 17:27:05.268[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:27:05.268[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 627.898 	|[0m
[32m2022-06-26 17:27:05.269[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.924174 	|[0m
[32m2022-06-26 17:27:05.270[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:28:51.291[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8907839980346787[0m
[32m2022-06-26 17:28:51.293[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.05744582799697216[0m

[32m2022-06-26 17:28:51.295[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 69/100:[0m
[32m2022-06-26 17:28:51.298[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:28:51.300[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 628.839 	|[0m
[32m2022-06-26 17:28:51.301[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.923122 	|[0m
[32m2022-06-26 17:28:51.301[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:30:37.209[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8884114710435815[0m
[32m2022-06-26 17:30:37.211[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.058444413197431246[0m
Epoch 00070: reducing learning rate of group 0 to 3.1623e-05.
Epoch 00070: reducing learning rate of group 0 to 6.3246e-04.

[32m2022-06-26 17:30:37.212[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 70/100:[0m
[32m2022-06-26 17:30:37.215[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:30:37.216[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 631.18 	|[0m
[32m2022-06-26 17:30:37.216[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.921829 	

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:32:23.054[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8861838563719451[0m
[32m2022-06-26 17:32:23.055[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.059441793831619634[0m

[32m2022-06-26 17:32:23.057[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 71/100:[0m
[32m2022-06-26 17:32:23.062[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:32:23.063[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 630.626 	|[0m
[32m2022-06-26 17:32:23.064[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.922252 	|[0m
[32m2022-06-26 17:32:23.065[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - 

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:34:08.921[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8838234108339372[0m
[32m2022-06-26 17:34:08.922[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.06044030320525831[0m

[32m2022-06-26 17:34:08.924[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 72/100:[0m
[32m2022-06-26 17:34:08.927[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:34:08.927[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 632.272 	|[0m
[32m2022-06-26 17:34:08.928[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.922209 	|[0m
[32m2022-06-26 17:34:08.929[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:35:54.698[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8815767131273213[0m
[32m2022-06-26 17:35:54.700[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.061437955888237465[0m

[32m2022-06-26 17:35:54.702[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 73/100:[0m
[32m2022-06-26 17:35:54.705[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:35:54.706[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 635.645 	|[0m
[32m2022-06-26 17:35:54.707[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.920129 	|[0m
[32m2022-06-26 17:35:54.709[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - 

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:37:39.906[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8793890163048753[0m
[32m2022-06-26 17:37:39.907[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.06243484639787019[0m

[32m2022-06-26 17:37:39.908[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 74/100:[0m
[32m2022-06-26 17:37:39.912[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:37:39.913[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 637.606 	|[0m
[32m2022-06-26 17:37:39.914[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.918833 	|[0m
[32m2022-06-26 17:37:39.915[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:39:25.485[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.877092296628123[0m
[32m2022-06-26 17:39:25.487[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.0634329550314939[0m

[32m2022-06-26 17:39:25.488[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 75/100:[0m
[32m2022-06-26 17:39:25.492[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:39:25.493[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 639.34 	|[0m
[32m2022-06-26 17:39:25.494[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.918447 	|[0m
[32m2022-06-26 17:39:25.495[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1ml

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:41:10.893[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8747359442771852[0m
[32m2022-06-26 17:41:10.895[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.06443160054658245[0m

[32m2022-06-26 17:41:10.896[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 76/100:[0m
[32m2022-06-26 17:41:10.900[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:41:10.901[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 641.743 	|[0m
[32m2022-06-26 17:41:10.902[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.916906 	|[0m
[32m2022-06-26 17:41:10.903[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:42:56.860[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8726822820727275[0m
[32m2022-06-26 17:42:56.861[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.06542665982235485[0m

[32m2022-06-26 17:42:56.862[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 77/100:[0m
[32m2022-06-26 17:42:56.866[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:42:56.867[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 645.439 	|[0m
[32m2022-06-26 17:42:56.868[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.915062 	|[0m
[32m2022-06-26 17:42:56.869[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:44:42.113[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8705481855059978[0m
[32m2022-06-26 17:44:42.114[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.0664229123712216[0m

[32m2022-06-26 17:44:42.115[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 78/100:[0m
[32m2022-06-26 17:44:42.118[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:44:42.118[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 647.207 	|[0m
[32m2022-06-26 17:44:42.119[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.913823 	|[0m
[32m2022-06-26 17:44:42.119[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:46:27.820[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8682715897150189[0m
[32m2022-06-26 17:46:27.821[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.0674210205066758[0m

[32m2022-06-26 17:46:27.822[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 79/100:[0m
[32m2022-06-26 17:46:27.825[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:46:27.825[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 648.597 	|[0m
[32m2022-06-26 17:46:27.826[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.912965 	|[0m
[32m2022-06-26 17:46:27.827[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:48:13.544[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8664007043411843[0m
[32m2022-06-26 17:48:13.546[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.06841096128641477[0m

[32m2022-06-26 17:48:13.547[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 80/100:[0m
[32m2022-06-26 17:48:13.550[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:48:13.550[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 653.166 	|[0m
[32m2022-06-26 17:48:13.551[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.910793 	|[0m
[32m2022-06-26 17:48:13.552[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:49:59.792[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8643566009315221[0m
[32m2022-06-26 17:49:59.794[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.06940553417620407[0m

[32m2022-06-26 17:49:59.796[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 81/100:[0m
[32m2022-06-26 17:49:59.803[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:49:59.804[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 655.078 	|[0m
[32m2022-06-26 17:49:59.804[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.91024 	|[0m
[32m2022-06-26 17:49:59.805[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:51:46.056[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8623139804554981[0m
[32m2022-06-26 17:51:46.057[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.07040054076674175[0m

[32m2022-06-26 17:51:46.059[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 82/100:[0m
[32m2022-06-26 17:51:46.062[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:51:46.062[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 655.864 	|[0m
[32m2022-06-26 17:51:46.063[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.909111 	|[0m
[32m2022-06-26 17:51:46.064[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:53:32.110[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8602041276266073[0m
[32m2022-06-26 17:53:32.111[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.0713969014759178[0m

[32m2022-06-26 17:53:32.112[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 83/100:[0m
[32m2022-06-26 17:53:32.115[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:53:32.115[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 657.593 	|[0m
[32m2022-06-26 17:53:32.116[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.908189 	|[0m
[32m2022-06-26 17:53:32.117[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:55:17.752[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8582881376215227[0m
[32m2022-06-26 17:55:17.753[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.07238902540579195[0m

[32m2022-06-26 17:55:17.754[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 84/100:[0m
[32m2022-06-26 17:55:17.757[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:55:17.758[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 660.541 	|[0m
[32m2022-06-26 17:55:17.759[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.907129 	|[0m
[32m2022-06-26 17:55:17.760[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:57:03.269[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.856342933168002[0m
[32m2022-06-26 17:57:03.271[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.07338174006103115[0m

[32m2022-06-26 17:57:03.272[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 85/100:[0m
[32m2022-06-26 17:57:03.275[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:57:03.276[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 663.354 	|[0m
[32m2022-06-26 17:57:03.277[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.905308 	|[0m
[32m2022-06-26 17:57:03.278[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 17:58:49.066[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.854259494309113[0m
[32m2022-06-26 17:58:49.067[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.0743778331594681[0m

[32m2022-06-26 17:58:49.068[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 86/100:[0m
[32m2022-06-26 17:58:49.071[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 17:58:49.072[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 664.001 	|[0m
[32m2022-06-26 17:58:49.073[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.904833 	|[0m
[32m2022-06-26 17:58:49.073[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1m

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 18:00:34.583[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8522239446871097[0m
[32m2022-06-26 18:00:34.585[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.07537336124278073[0m
Epoch 00087: reducing learning rate of group 0 to 1.0000e-05.
Epoch 00087: reducing learning rate of group 0 to 2.0000e-04.

[32m2022-06-26 18:00:34.586[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 87/100:[0m
[32m2022-06-26 18:00:34.589[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 18:00:34.590[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 665.097 	|[0m
[32m2022-06-26 18:00:34.591[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.903565 	

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 18:02:20.225[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.850165314176489[0m
[32m2022-06-26 18:02:20.227[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.07636927290781202[0m

[32m2022-06-26 18:02:20.228[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 88/100:[0m
[32m2022-06-26 18:02:20.232[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 18:02:20.233[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 667.957 	|[0m
[32m2022-06-26 18:02:20.234[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.902756 	|[0m
[32m2022-06-26 18:02:20.235[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 18:04:05.676[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8481526869148657[0m
[32m2022-06-26 18:04:05.677[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.07736438392228094[0m

[32m2022-06-26 18:04:05.677[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 89/100:[0m
[32m2022-06-26 18:04:05.680[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 18:04:05.681[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 671.478 	|[0m
[32m2022-06-26 18:04:05.682[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.900892 	|[0m
[32m2022-06-26 18:04:05.683[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 18:05:51.305[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8463843908847762[0m
[32m2022-06-26 18:05:51.306[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.07835098613909276[0m

[32m2022-06-26 18:05:51.308[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 90/100:[0m
[32m2022-06-26 18:05:51.311[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 18:05:51.312[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 672.244 	|[0m
[32m2022-06-26 18:05:51.313[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.900431 	|[0m
[32m2022-06-26 18:05:51.314[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 18:07:36.996[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8445221032286683[0m
[32m2022-06-26 18:07:36.997[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.07934129285017644[0m

[32m2022-06-26 18:07:36.998[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 91/100:[0m
[32m2022-06-26 18:07:37.003[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 18:07:37.004[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 675.224 	|[0m
[32m2022-06-26 18:07:37.005[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.89891 	|[0m
[32m2022-06-26 18:07:37.006[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 18:09:22.986[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8427583859198585[0m
[32m2022-06-26 18:09:22.988[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.080327663384169[0m

[32m2022-06-26 18:09:22.990[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 92/100:[0m
[32m2022-06-26 18:09:22.993[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 18:09:22.995[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 677.413 	|[0m
[32m2022-06-26 18:09:22.996[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.897288 	|[0m
[32m2022-06-26 18:09:22.997[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1m

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 18:11:09.066[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8409395216005288[0m
[32m2022-06-26 18:11:09.067[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.08131678524283448[0m

[32m2022-06-26 18:11:09.068[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 93/100:[0m
[32m2022-06-26 18:11:09.070[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 18:11:09.071[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 679.479 	|[0m
[32m2022-06-26 18:11:09.071[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.896447 	|[0m
[32m2022-06-26 18:11:09.072[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 18:12:55.309[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8389739471886181[0m
[32m2022-06-26 18:12:55.310[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.08231111602216547[0m

[32m2022-06-26 18:12:55.312[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 94/100:[0m
[32m2022-06-26 18:12:55.315[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 18:12:55.315[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 681.219 	|[0m
[32m2022-06-26 18:12:55.316[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.895401 	|[0m
[32m2022-06-26 18:12:55.317[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 18:14:41.372[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8373336884610939[0m
[32m2022-06-26 18:14:41.373[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.08329130546363456[0m

[32m2022-06-26 18:14:41.375[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 95/100:[0m
[32m2022-06-26 18:14:41.379[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 18:14:41.380[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 683.302 	|[0m
[32m2022-06-26 18:14:41.381[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.894358 	|[0m
[32m2022-06-26 18:14:41.382[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 18:16:27.448[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8356922394165595[0m
[32m2022-06-26 18:16:27.449[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.08427029296597803[0m

[32m2022-06-26 18:16:27.450[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 96/100:[0m
[32m2022-06-26 18:16:27.453[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 18:16:27.454[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 685.523 	|[0m
[32m2022-06-26 18:16:27.455[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.892765 	|[0m
[32m2022-06-26 18:16:27.455[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 18:18:13.520[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8339685496580035[0m
[32m2022-06-26 18:18:13.521[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.08525546785436293[0m

[32m2022-06-26 18:18:13.522[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 97/100:[0m
[32m2022-06-26 18:18:13.525[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 18:18:13.526[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 687.958 	|[0m
[32m2022-06-26 18:18:13.527[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.891898 	|[0m
[32m2022-06-26 18:18:13.527[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 18:20:00.080[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8321842872609196[0m
[32m2022-06-26 18:20:00.082[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.08624449426607969[0m

[32m2022-06-26 18:20:00.083[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 98/100:[0m
[32m2022-06-26 18:20:00.086[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 18:20:00.087[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 689.073 	|[0m
[32m2022-06-26 18:20:00.088[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.891434 	|[0m
[32m2022-06-26 18:20:00.089[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 18:21:45.808[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8305630072461575[0m
[32m2022-06-26 18:21:45.809[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.08722458820583187[0m

[32m2022-06-26 18:21:45.811[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 99/100:[0m
[32m2022-06-26 18:21:45.814[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 18:21:45.815[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 691.06 	|[0m
[32m2022-06-26 18:21:45.816[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.890544 	|[0m
[32m2022-06-26 18:21:45.817[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1

train:   0%|          | 0/339 [00:00<?, ?it/s]

validation:   0%|          | 0/112 [00:00<?, ?it/s]

[32m2022-06-26 18:23:31.715[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m590[0m - [1mbr was changed to 0.8290065502177499[0m
[32m2022-06-26 18:23:31.716[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m591[0m - [1mlambda_llr was changed to 0.08819784233820116[0m

[32m2022-06-26 18:23:31.718[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 100/100:[0m
[32m2022-06-26 18:23:31.722[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-26 18:23:31.723[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 693.034 	|[0m
[32m2022-06-26 18:23:31.724[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.889118 	|[0m
[32m2022-06-26 18:23:31.725[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - 

*** SIGTERM received at time=1656335415 on cpu 73 ***
PC: @     0x7f4da3f70155  (unknown)  __clone
    @     0x7f4da41bd3c0  1257294768  (unknown)
    @     0x7f4da3b25bb0  (unknown)  (unknown)
    @     0x563542705fa0  (unknown)  (unknown)
[2022-06-27 13:10:15,855 E 10960 50473] logging.cc:325: *** SIGTERM received at time=1656335415 on cpu 73 ***
[2022-06-27 13:10:15,855 E 10960 50473] logging.cc:325: PC: @     0x7f4da3f70155  (unknown)  __clone
[2022-06-27 13:10:15,860 E 10960 50473] logging.cc:325:     @     0x7f4da41bd3c0  1257294768  (unknown)
[2022-06-27 13:10:15,866 E 10960 50473] logging.cc:325:     @     0x7f4da3b25bb0  (unknown)  (unknown)
[2022-06-27 13:10:15,875 E 10960 50473] logging.cc:325:     @     0x563542705fa0  (unknown)  (unknown)


In [13]:
# Run the algorithm's evaluation on the 'test' subset and keep whatever it returns.
# A later cell reads the accuracy values from results['scalar']['acc'].
# NOTE(review): `alg` must already exist in the kernel; execution counts in this notebook are
# non-sequential, so confirm which training run produced the `alg` being evaluated here.
results = alg.evaluate('test')

test:   0%|          | 0/454 [00:00<?, ?it/s]

In [15]:
# Average the accuracy values stored under results['scalar']['acc'].
# As the last expression of the cell, the mean is shown as the cell output.
np.mean(results['scalar']['acc'])

0.8330432722747063

In [14]:
# Load the TensorBoard notebook extension so the %tensorboard line magic is available.
%load_ext tensorboard

In [15]:
%tensorboard --logdir /home/shared/data/results/covtype/covtype/CovtypeAlgorithm/debug/0001_20220622_160022 --port=17067 --bind_all

In [6]:
# Hyperparameters for the run tagged --identifier=half_precision (100 epochs, batch size 256).
# NOTE(review): unlike the other beam_arguments calls in this notebook, this one passes no parser
# as its first argument and uses --no-amp rather than --no-half; confirm both are intended.
half_precision_flags = (
    f"--project-name=covtype --root-dir={root_dir} --algorithm=CovtypeAlgorithm --device=1 --no-amp --lr-d=1e-3 --batch-size=256",
    "--n-epochs=100 --clip=0 --parallel=1 --accumulate=1 --cudnn-benchmark --identifier=half_precision",
    "--weight-decay=1e-5 --beta1=0.9 --beta2=0.999",
)

# Keyword overrides passed alongside the flag strings (same order as the flags above them).
half_precision_overrides = dict(
    label_smoothing=.05,
    weight_factor=.5,
    path_to_data=path_to_data,
    gamma=1.,
    dropout=.0,
    activation='gelu',
    channels=512,
)

args = beam_arguments(*half_precision_flags, **half_precision_overrides)

# Build the experiment from the assembled arguments; the next cell calls it to start the run.
experiment = Experiment(args)

[32m2022-06-23 11:44:34.677[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m183[0m - [1mbeam project: covtype[0m
[32m2022-06-23 11:44:34.679[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m184[0m - [1mExperiment Hyperparameters[0m
[32m2022-06-23 11:44:34.683[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m189[0m - [1mproject_name: covtype[0m
[32m2022-06-23 11:44:34.685[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m189[0m - [1midentifier: half_precision[0m
[32m2022-06-23 11:44:34.686[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m189[0m - [1malgorithm: CovtypeAlgorithm[0m
[32m2022-06-23 11:44:34.687[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m189[0m - [1mmp_port: None[0m
[32m2022-06-23 11:44:34.688[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m189[0m - 

In [7]:
# Call the experiment with the covtype algorithm generator and keep the returned object as `alg`.
# In the recorded output this ran in "Single worker mode" and iterated train/validation epochs.
alg = experiment(covtype_algorithm_generator)

[32m2022-06-23 11:44:37.677[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mrun[0m:[36m553[0m - [1mSingle worker mode[0m
[32m2022-06-23 11:44:37.680[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mrun_worker[0m:[36m45[0m - [1mWorker: 1/1 is running...[0m


train:   0%|          | 0/1360 [00:00<?, ?it/s]

validation:   0%|          | 0/452 [00:00<?, ?it/s]


[32m2022-06-23 11:50:32.263[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 1/100:[0m
[32m2022-06-23 11:50:32.272[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-23 11:50:32.274[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 228.893 	|[0m
[32m2022-06-23 11:50:32.274[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.695109 	|[0m
[32m2022-06-23 11:50:32.275[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mlr 0.001 	|[0m
[32m2022-06-23 11:50:32.277[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mvalidation:[0m
[32m2022-06-23 11:50:32.283[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 195.103 	|[0m
[32m2022-06-23 11:5

train:   0%|          | 0/1360 [00:00<?, ?it/s]

validation:   0%|          | 0/452 [00:00<?, ?it/s]


[32m2022-06-23 11:56:29.838[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 2/100:[0m
[32m2022-06-23 11:56:29.844[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-23 11:56:29.845[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 167.189 	|[0m
[32m2022-06-23 11:56:29.846[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.816791 	|[0m
[32m2022-06-23 11:56:29.846[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mlr 0.001 	|[0m
[32m2022-06-23 11:56:29.847[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mvalidation:[0m
[32m2022-06-23 11:56:29.847[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss nan 	|[0m
[32m2022-06-23 11:56:29

train:   0%|          | 0/1360 [00:00<?, ?it/s]

validation:   0%|          | 0/452 [00:00<?, ?it/s]


[32m2022-06-23 12:03:08.504[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 3/100:[0m
[32m2022-06-23 12:03:08.515[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-23 12:03:08.517[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss 139.599 	|[0m
[32m2022-06-23 12:03:08.525[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.870749 	|[0m
[32m2022-06-23 12:03:08.527[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mlr 0.001 	|[0m
[32m2022-06-23 12:03:08.529[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mvalidation:[0m
[32m2022-06-23 12:03:08.531[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss nan 	|[0m
[32m2022-06-23 12:03:08

train:   0%|          | 0/1360 [00:00<?, ?it/s]

validation:   0%|          | 0/452 [00:00<?, ?it/s]


[32m2022-06-23 12:08:59.802[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 4/100:[0m
[32m2022-06-23 12:08:59.808[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-23 12:08:59.810[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss nan 	|[0m
[32m2022-06-23 12:08:59.811[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.895735 	|[0m
[32m2022-06-23 12:08:59.813[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mlr 0.001 	|[0m
[32m2022-06-23 12:08:59.815[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mvalidation:[0m
[32m2022-06-23 12:08:59.817[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss nan 	|[0m
[32m2022-06-23 12:08:59.820

train:   0%|          | 0/1360 [00:00<?, ?it/s]

validation:   0%|          | 0/452 [00:00<?, ?it/s]


[32m2022-06-23 12:14:43.038[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36msave_model_results[0m:[36m397[0m - [1mFinished epoch 5/100:[0m
[32m2022-06-23 12:14:43.057[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mtrain:[0m
[32m2022-06-23 12:14:43.058[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss nan 	|[0m
[32m2022-06-23 12:14:43.060[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1macc 0.903142 	|[0m
[32m2022-06-23 12:14:43.060[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mlr 0.001 	|[0m
[32m2022-06-23 12:14:43.062[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m443[0m - [1mvalidation:[0m
[32m2022-06-23 12:14:43.063[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36mlog_data[0m:[36m447[0m - [1mloss nan 	|[0m
[32m2022-06-23 12:14:43.064

train:   0%|          | 0/1360 [00:00<?, ?it/s]

KeyboardInterrupt: 

## Hyperparameter optimization with Ray and Optuna

In [3]:
# Base hyperparameters shared by every trial of the study (40 epochs, batch size 256).
# Values listed in the tuning search space are sampled per trial by the tuning cell.
study_flags = (
    f"--project-name=covtype --root-dir={root_dir} --algorithm=CovtypeAlgorithm --device=0 --no-half --lr-d=1e-3 --batch-size=256",
    "--n-epochs=40 --clip=0 --parallel=1 --accumulate=1 --cudnn-benchmark",
    "--weight-decay=1e-5 --beta1=0.9 --beta2=0.999",
)

# Keyword overrides passed alongside the flag strings.
study_overrides = dict(
    label_smoothing=.05,
    weight_factor=.0,
    path_to_data=path_to_data,
    dropout=.0,
    activation='gelu',
    channels=128,
    n_rules=64,
    n_layers=2,
)

args = beam_arguments(get_covtype_parser(), *study_flags, **study_overrides)

# Wrap the algorithm generator and the base arguments in a Study for hyperparameter search.
study = Study(covtype_algorithm_generator, args)

[32m2022-06-23 16:26:10.599[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m82[0m - [1mHyperparameter Optimization[0m
[32m2022-06-23 16:26:10.600[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m83[0m - [1mbeam project: covtype[0m
[32m2022-06-23 16:26:10.601[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m84[0m - [1mExperiment Hyperparameters[0m
[32m2022-06-23 16:26:10.601[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m87[0m - [1mproject_name: covtype[0m
[32m2022-06-23 16:26:10.602[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m87[0m - [1midentifier: debug_hp_optimization_20220623_162610[0m
[32m2022-06-23 16:26:10.602[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[36m__init__[0m:[36m87[0m - [1malgorithm: CovtypeAlgorithm[0m
[32m2022-06-23 16:26:10.603[0m | [1mINFO    [0m | [36msrc.beam.experiment[0m:[

In [4]:
# Search space: one Ray Tune sampler per hyperparameter (key order kept as originally written).
search_space = dict(
    lr_dense=tune.loguniform(1e-4, 1e-2),
    lr_sparse=tune.loguniform(1e-3, 1e-1),
    dropout=tune.uniform(.0, .25),
    scheduler_factor=tune.uniform(.1, .5),
    scheduler_patience=tune.choice([12, 16, 20]),
    weight_decay=tune.loguniform(1e-6, 1e-3),
    beta1=tune.choice([.9, .95]),
    beta2=tune.choice([.99, .999]),
    n_tables=tune.choice([1, 5, 15]),
    n_quantiles=tune.choice([4, 10, 20]),
    weight_factor=tune.choice([.0, .25, .5]),
    label_smoothing=tune.choice([.0, .1, .2]),
    channels=tune.choice([64, 128, 256]),
    n_rules=tune.choice([64, 128, 256]),
    n_layers=tune.choice([1, 2]),
    activation=tune.choice(['celu', 'gelu']),
    k_p=tune.loguniform(.01, .1),
    k_i=tune.loguniform(.001, .01),
    k_d=tune.loguniform(.001, .01),
    initial_mask=tune.uniform(.9, 1.),
)

# Launch the search: maximise "mean_accuracy" with Optuna proposing configurations, a notebook
# progress table that overwrites itself, and the trial budget / concurrency / GPU settings below.
# NOTE(review): the keyword arguments are presumably forwarded to Ray Tune's run API; confirm
# against Study.tune.
analysis = study.tune(
    config=search_space,
    metric="mean_accuracy",
    max_concurrent_trials=2,
    resources_per_trial={"gpu": 1},
    mode="max",
    search_alg=OptunaSearch(),
    progress_reporter=JupyterNotebookReporter(overwrite=True),
    num_samples=1000,
)

Trial name,status,loc,activation,beta1,beta2,channels,dropout,initial_mask,k_d,k_i,k_p,label_smoothing,lr_dense,lr_sparse,n_layers,n_quantiles,n_rules,n_tables,scheduler_factor,scheduler_patience,weight_decay,weight_factor,acc,iter,total time (s)
runner_tune_63c3d776,RUNNING,172.17.0.7:66237,gelu,0.9,0.999,256,0.058916,0.999251,0.00353359,0.00155413,0.0555205,0.2,0.00217149,0.017969,2,20,128,15,0.135275,12,0.000351825,0.0,0.948467,36,5490.23
runner_tune_edaad5d2,RUNNING,172.17.0.7:67440,gelu,0.9,0.999,256,0.0494754,0.998241,0.00445461,0.0012865,0.0747774,0.2,0.000941906,0.0200523,2,20,64,15,0.122971,12,0.00038737,0.0,0.950014,29,2290.66
runner_tune_008a91a0,TERMINATED,172.17.0.7:50284,gelu,0.9,0.99,256,0.0807869,0.996324,0.00680326,0.00142563,0.0510722,0.2,0.000819026,0.0152461,2,20,128,15,0.112404,12,0.000984329,0.0,0.953592,40,6066.92
runner_tune_028e4942,TERMINATED,172.17.0.7:20640,gelu,0.9,0.99,64,0.138117,0.98606,0.00797104,0.00847916,0.0140101,0.2,0.000334277,0.050323,1,20,256,1,0.153175,16,1.73845e-06,0.0,0.93171,40,5513.77
runner_tune_080099b0,TERMINATED,172.17.0.7:80084,celu,0.9,0.999,64,0.158326,0.996888,0.00856642,0.00988607,0.0889488,0.1,0.00986728,0.0959956,2,20,256,1,0.1056,16,1.25602e-06,0.0,0.912118,40,10459.7
runner_tune_0e789ebc,TERMINATED,172.17.0.7:60721,celu,0.9,0.999,256,0.0295621,0.999882,0.00456891,0.00102814,0.0707723,0.2,0.000994112,0.0304406,2,4,64,15,0.100448,12,0.000715209,0.0,0.947706,40,2903.16
runner_tune_10fb7f6c,TERMINATED,172.17.0.7:72407,gelu,0.9,0.99,256,0.220779,0.968569,0.00308747,0.002626,0.0240213,0.1,0.000142814,0.00126458,1,10,256,5,0.267074,20,1.47414e-05,0.25,0.896104,40,8462.36
runner_tune_121f98fc,TERMINATED,172.17.0.7:40384,gelu,0.95,0.99,256,0.1964,0.963854,0.00830381,0.0019387,0.0374598,0.1,0.00100392,0.00268295,2,10,128,5,0.226368,20,3.64052e-05,0.0,0.933931,40,5975.81
runner_tune_1fc0b7b0,TERMINATED,172.17.0.7:38270,celu,0.95,0.999,256,0.185739,0.982717,0.00635819,0.00250672,0.0167592,0.0,0.00241463,0.0140612,2,10,128,5,0.165462,20,1.75448e-05,0.0,0.928149,40,5984.78
runner_tune_20003a20,TERMINATED,172.17.0.7:14600,celu,0.9,0.99,64,0.189547,0.979488,0.0099452,0.00441909,0.0125956,0.2,0.000193391,0.0418173,1,20,256,15,0.190423,16,9.5758e-06,0.0,0.921564,40,5645.03




KeyboardInterrupt: 

[2m[36m(runner_tune pid=67440)[0m [32m2022-06-26 06:23:07.687[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m584[0m - [1mbr was changed to 0.9798078372723117[0m
[2m[36m(runner_tune pid=67440)[0m [32m2022-06-26 06:23:07.687[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m585[0m - [1mlambda_llr was changed to 0.017812550184276018[0m
[2m[36m(runner_tune pid=66237)[0m [32m2022-06-26 06:23:49.308[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m584[0m - [1mbr was changed to 0.9730077730625055[0m
[2m[36m(runner_tune pid=66237)[0m [32m2022-06-26 06:23:49.308[0m | [1mINFO    [0m | [36msrc.beam.model[0m:[36mstep[0m:[36m585[0m - [1mlambda_llr was changed to 0.024606548212574783[0m
