In [1]:
## Alternative interactive backend (disabled):
##%matplotlib widget
## Original note: with %matplotlib notebook, ipympl seems to be required as part of the
## environment, either installed in the conda environment or via "pip install ipympl";
## otherwise NO plots are shown in the notebook, although plt.savefig() still works.
## NOTE(review): ipympl is the package behind `%matplotlib widget`; confirm which magic
## this remark was really meant for.
%matplotlib notebook  
##%matplotlib inline    ## -- plt.savefig() works, but re-sizing does NOT


This notebook is the second attempt to read in track information and use it to predict the KDE used as input to PvFinder. This time, we are reading in poca KDEs rather than the original KDEs. 

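collectdata_kde_C.py uses poca_z, poca_x, poca_y, major_axis_x, major_axis_y, and major_axis_z as the six track parameters (for the moment). Note that the import cell below actually loads `collect_t2kde_data` from `model.collectdata_kde_Ellipsoids`, and the model printed below takes 9 input features, so this description may be out of date.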


Check the current GPU usage. Please try to be nice!

In [2]:
!nvidia-smi

Sun Aug 29 20:13:39 2021       
+-----------------------------------------------------------------------------+
| NVIDIA-SMI 470.42.01    Driver Version: 470.42.01    CUDA Version: 11.4     |
|-------------------------------+----------------------+----------------------+
| GPU  Name        Persistence-M| Bus-Id        Disp.A | Volatile Uncorr. ECC |
| Fan  Temp  Perf  Pwr:Usage/Cap|         Memory-Usage | GPU-Util  Compute M. |
|                               |                      |               MIG M. |
|   0  NVIDIA TITAN V      Off  | 00000000:03:00.0 Off |                  N/A |
| 43%   60C    P2   100W / 250W |   8775MiB / 12066MiB |     96%      Default |
|                               |                      |                  N/A |
+-------------------------------+----------------------+----------------------+
|   1  Tesla P100-PCIE...  Off  | 00000000:83:00.0 Off |                    0 |
| N/A   38C    P0    34W / 250W |   3321MiB / 16280MiB |      0%      Default |
|       

> **WARNING**: The card numbers here are *not* the same as in CUDA. You have been warned.

This notebook is the first attempt to read in track information and use it to predict the KDE used as input to PvFinder.


## Imports

In [3]:
import matplotlib.pyplot as plt
import numpy as np
import time
import torch
import pandas as pd

# Python 3 standard library
from pathlib import Path

##from torchsummary import summary

### Set up local parameters

In [4]:
# Number of training epochs for this run
n_epochs = 200

## Notes carried over from earlier iterations:
##  201027 -- about to go to bed, so try 2500 epochs with lr = 1e55 [sic -- presumably 1e-5]
##  previous iteration had l4 [sic -- presumably lr] = 3e-5 and cost dropped almost linearly
##  for 100 epochs -- final training costs ~ 2.02, validation cost ~ 2.01
##
## for iter 4, try 10 epochs with lr = 3e-6
## usually have a big jump down at epoch 0; want to try a
## small number of epochs per iteration and see what happens (iter4: 10 epochs gave
## training cost dropping from 1.54 to 1.50 immediately, then dropping very slowly)

# `name` is the run label; it is used as the stem of the saved model files
# and as the last component of the output folder.
name   = 'baileyds200ep_DDplus_iter6_lrstepschedulecontinued2'

# The output folder is named after the run (change if you want).
## Special instructions for those working on goofy at UC
## Please be very careful to make sure that your folder
## does not live in a subdirectory of your home directory
## this disk has very little capacity. Instead, use
## a subdirectory in /share/lazy with a symbolic link to
## it in this (the notebooks) subdirectory
folder = 'baileyds/DDplus/' + name
output = Path(folder)

# Size of batches
batch_size = 16 ## was 64
# How fast to learn (initial learning rate handed to the optimizer)
learning_rate = 1e-4

Make the output directory if it does not exist:

In [5]:
# Create the run's output directory; an already-existing directory is not an error.
# `parents=True` is not passed, so the parent directories must already exist
# (otherwise mkdir raises FileNotFoundError instead of creating them).
output.mkdir(exist_ok=True)

## Get the helper functions

Add the directory with the model
definitions to the path so we can import from it:

> When you type `import X`,
Python searches `sys.path` for a python
file named `X.py` to import. So we need to add the model directory to the path.

In [6]:
# Data loading helper. Earlier variants are kept below (commented out) for reference.
##from model.collectdata_kde_B import collect_t2kde_data
## collectdata_kde_C should use the new poca KDE rather than the original kernel KDE
## NOTE(review): the module actually imported is collectdata_kde_Ellipsoids.
from model.collectdata_kde_Ellipsoids import collect_t2kde_data


# Loss function
##from loss import Loss
## kde_loss_D includes both a ratio term and a chisq term, 98% ave_chisq
## kde_loss_E adds a chi^4 term to the kde_loss_D return value
## this is intended to emphasize the importance of values significantly different than zero
## NOTE(review): the notes above describe kde_loss_D / kde_loss_E, but the loss imported
## here is kde_loss_Ba -- confirm which terms it contains.
from model.kde_loss_Ba import Loss

##  TracksToKDE_Ellipsoids_SevenLayerCake has 7 hidden layers producing the 4000-bin KDE histogram
##  It takes 9 input features (poca centers + (A,B,C,D,E,F)).
##  NOTE(review): the class imported below is TracksToKDE_Ellipsoids_DDplus, not
##  SevenLayerCake, so the layer count quoted above may not apply to it.
from model.models_kde import TracksToKDE_Ellipsoids_DDplus as Model


# NOTE: trainNet is imported twice; the second import (functions.my_training_kde)
# rebinds the name, so that is the version used by the rest of the notebook.
from model.training_kde import trainNet, select_gpu, Results
from functions.my_training_kde import trainNet
# Plot helpers for the live training/validation cost figure
from model.plots import dual_train_plots, replace_in_ax

In [7]:
# Per-epoch training history with one column per entry of Results._fields.
# This gets built up during the run - do not rerun this cell
# (re-running it resets `results` and `param_states` to empty).
results = pd.DataFrame([], columns=Results._fields)
# my entry: helper used to snapshot the model's parameter state
from functions.utils import get_param_state
# Snapshots returned by get_param_state(model); one is appended after the
# pretrained weights are loaded and one after every training epoch.
param_states = []

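Set up the Torch device configuration. All tensors and model parameters need to know which device they should live on.
This takes a BUS ID number (presumably referring to the `select_gpu` helper, whose call is commented out in the cell below): the BUS ID matches the `nvidia-smi` listing at the top of this notebook. The cell below instead hard-codes a CUDA device string; as warned above, CUDA device numbers are not necessarily the same as the `nvidia-smi` card numbers.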

In [8]:
# Device on which the model and (where requested) the data are placed.
# The device string is hard-coded; the select_gpu(0) helper call is left commented out.
# NOTE(review): "cuda:2" requires at least three CUDA-visible GPUs -- confirm on this host.
device = "cuda:2"#select_gpu(0)
##device = "cpu"

## Loading data

Load the dataset, split into parts, then move to device (see `collectdata.py` in the `../model` directory)

## Preparing the model

Prepare a model, use multiple GPUs if they are VISIBLE, and move the model to the device.

In [9]:
##print("Let's use", torch.cuda.device_count(), "GPUs!")
##if torch.cuda.device_count() > 1:
##    model = torch.nn.DataParallel(model)

In [10]:
## The PyTorch optimizer documentation (https://pytorch.org/docs/stable/optim.html) says:
##
##   If you need to move a model to GPU via .cuda(), please do so before constructing
##   optimizers for it. Parameters of a model after .cuda() will be different objects
##   with those before the call.
##
##   In general, you should make sure that optimized parameters live in consistent
##   locations when optimizers are constructed and used.
##
## so the model is built here, before the optimizer (although we use model.to(device)
## rather than calling .cuda() explicitly).

# Output widths handed to the model constructor; all eleven are currently 50.
(nOut1, nOut2, nOut3, nOut4, nOut5, nOut6,
 nOut7, nOut8, nOut9, nOut10, nOut11) = (50,) * 11
latentChannels = 4
model = Model(nOut1, nOut2, nOut3, nOut4, nOut5, nOut6,
              nOut7, nOut8, nOut9, nOut10, nOut11, latentChannels)

##summary(model, input_size=(4, 4000))
##print(model.parameters)

## Optional weight freezing: children whose position is below the threshold in the
## guard get requires_grad=False, e.g. to keep weights taken from an earlier model
## (trained with the original target histograms) fixed so that learning focuses on
## the remaining layers, or vice versa. With the threshold at 0 nothing is frozen.
children = list(model.children())
for ct, child in enumerate(children):
    print('ct, child = ',ct, "  ", child)
    if ct >= 0:
        # not selected for freezing
        continue
    print("     About to set param.requires_grad=False for ct = ", ct, "params")
    for param in child.parameters():
        param.requires_grad = False
# leave `ct` equal to the number of children visited
ct = len(children)

##  mds 200121 loss = Loss(epsilon=1e-5,coefficient=1.0)
##  loss = Loss(epsilon=1e-5,coefficient=2.5)
##loss = Loss(epsilon=3e-5, debug=False)
loss = Loss(epsilon=3e-5)

ct, child =  0    Linear(in_features=9, out_features=50, bias=True)
ct, child =  1    Linear(in_features=50, out_features=50, bias=True)
ct, child =  2    Linear(in_features=50, out_features=50, bias=True)
ct, child =  3    Linear(in_features=50, out_features=50, bias=True)
ct, child =  4    Linear(in_features=50, out_features=50, bias=True)
ct, child =  5    Linear(in_features=50, out_features=50, bias=True)
ct, child =  6    Linear(in_features=50, out_features=50, bias=True)
ct, child =  7    Linear(in_features=50, out_features=50, bias=True)
ct, child =  8    Linear(in_features=50, out_features=50, bias=True)
ct, child =  9    Linear(in_features=50, out_features=50, bias=True)
ct, child =  10    Linear(in_features=50, out_features=50, bias=True)
ct, child =  11    Linear(in_features=50, out_features=16000, bias=True)
ct, child =  12    Conv1d(4, 25, kernel_size=(25,), stride=(1,), padding=(12,))
ct, child =  13    Conv1d(25, 1, kernel_size=(5,), stride=(1,), padding=(2,))
ct, child 

Let's move the model's weight matrices to the GPU:

In [11]:
# Move the model's parameters to the selected device. This is done before the
# optimizer is constructed, following the PyTorch advice quoted when the model was built.
model = model.to(device)

In [12]:
# Adam optimizer over all model parameters, starting from `learning_rate`.
optimizer = torch.optim.Adam(model.parameters(), lr=learning_rate)
# Step learning-rate schedule wrapped around the optimizer; it is passed to trainNet.
# NOTE(review): judging by the training log ("lr factor is 0.7 ^ exponent"), the rate is
# multiplied by decay_rate about every drop_rate epochs -- confirm in functions/my_optimizers.
from functions.my_optimizers import StepLrSchedule
step_schedule = StepLrSchedule(optimizer, decay_rate=0.7, drop_rate=20)
##optimizer = torch.optim.SGD(model.parameters(), lr=learning_rate)

In [13]:
print('output = ',output)
##print('oldOutput = ',oldOutput)

## ---------------------------------------------------------------------------
## Step 1: list the parameter names of the freshly constructed model
## (mds 190725, for debugging).
##   ML -> /share/lazy/sokoloff/ML
## ---------------------------------------------------------------------------
model_dict = model.state_dict()
print("for model_dict")
for index, k in enumerate(model_dict):
    print("index, k =  ",index,"  ",k)

## ---------------------------------------------------------------------------
## Step 2: when starting "ab initio", reduce the biases of layer1..layer11, as the
## bias gets summed for each track contributing to the predicted KDE.
## NOTE: any of these biases that is also present in the checkpoint loaded in
## step 3 is replaced by the checkpoint value.
## ---------------------------------------------------------------------------
updated_dict = model_dict
for layer_number in range(1, 12):
    bias_key = f"layer{layer_number}.bias"
    updated_dict[bias_key] = 0.005*model_dict[bias_key]

model.load_state_dict(updated_dict,strict=False)

model_dict = model.state_dict()
##print("updated model_dict = ",model_dict)

## ---------------------------------------------------------------------------
## Step 3: continue from the weights saved by the previous iteration.
##
## Recipe for re-using only part of a pre-existing model (kept for reference, see
## https://discuss.pytorch.org/t/how-to-load-part-of-pre-trained-model/1113):
##   1. filter out unnecessary keys:
##        pretrained_dict = {k: v for k, v in pretrained_dict.items() if k in model_dict}
##   2. overwrite entries in the existing state dict:
##        model_dict.update(pretrained_dict)
##   3. load the new state dict with strict=False, as the two models' attributes
##      do not agree exactly (e.g. when starting from a model with a fully connected
##      last layer rather than a convolutional layer); see
##      https://pytorch.org/docs/master/_modules/torch/nn/modules/module.html#Module.load_state_dict
## An earlier starting point was
##   'ML/29July2020_Trks_to_KDE_C_lossB_100epochs_b64_1m3_nOut_50x50/29July2020_Trks_to_KDE_C_lossB_100epochs_b64_1m3_nOut_50x50_final.pyt'
## ---------------------------------------------------------------------------

# ## finished at training cost = 1.46, validation cost = 1.50
d_folder = 'baileyds200ep_DDplus_iter5_lrstepschedulecontinued'
d_name = d_folder
suffix = 'final'
dict_name = 'baileyds/DDplus/' + d_folder + '/' + d_name + '_'+ suffix + '.pyt'
print('dict_name = ',dict_name)

# map_location places the checkpoint tensors directly on the device chosen for this
# run. Without it torch.load restores them onto the device they were saved from,
# which may be a different (busy or absent) GPU.
pretrained_dict = torch.load(dict_name, map_location=device)

# strict=False tolerates differing key sets; report them rather than silently
# continuing with partially initialised weights.
load_report = model.load_state_dict(pretrained_dict,strict=False)
if load_report.missing_keys:
    print('keys missing from pretrained_dict = ', load_report.missing_keys)
if load_report.unexpected_keys:
    print('unexpected keys in pretrained_dict = ', load_report.unexpected_keys)

#mine: snapshot of the parameters before any training in this run
param_states.append(get_param_state(model))


output =  baileyds/DDplus/baileyds200ep_DDplus_iter6_lrstepschedulecontinued2
for model_dict
index, k =   0    layer1.weight
index, k =   1    layer1.bias
index, k =   2    layer2.weight
index, k =   3    layer2.bias
index, k =   4    layer3.weight
index, k =   5    layer3.bias
index, k =   6    layer4.weight
index, k =   7    layer4.bias
index, k =   8    layer5.weight
index, k =   9    layer5.bias
index, k =   10    layer6.weight
index, k =   11    layer6.bias
index, k =   12    layer7.weight
index, k =   13    layer7.bias
index, k =   14    layer8.weight
index, k =   15    layer8.bias
index, k =   16    layer9.weight
index, k =   17    layer9.bias
index, k =   18    layer10.weight
index, k =   19    layer10.bias
index, k =   20    layer11.weight
index, k =   21    layer11.bias
index, k =   22    layer12new.weight
index, k =   23    layer12new.bias
index, k =   24    conv1.weight
index, k =   25    conv1.bias
index, k =   26    conv2.weight
index, k =   27    conv2.bias
index, k =   

In [14]:
##print('validation.dataset.tensors = ',validation.dataset.tensors)
# Default figure size (width, height) for every figure created after this cell.
fig_size = [10, 4]
plt.rcParams["figure.figsize"] = fig_size

In [15]:
## All three loaders below are built from the same HDF5 file; they differ only in the
## slice of events they take and in whether `device` is passed.
## You can put as many files here as desired. Other files used previously:
##   '/share/lazy/pv-finder/20k_evts_for_KDE_learning_200716.h5'
##   '/share/lazy/will/data/June30_2020_80k_2.h5'
##   '/share/lazy/will/data/June30_2020_80k_3.h5'
##   '/share/lazy/will/data/June30_2020_80k_4.h5'
data_file = '/share/lazy/will/data/June30_2020_80k_1.h5'

train_events = slice(None, 40000)
eve_events = slice(40000, 60000)
val_events = slice(60000, None)

## Training dataset.
## Original note on `device=device`: if we are using a larger dataset (240K events, with
## the datasets above, and 11 GB of GPU memory), the dataset will overflow the GPU memory;
## device=device will allow the data to move back and forth between the CPU and GPU
## memory. While this allows use of a larger dataset, it slows down performance by
## about 10%.  So comment out when not needed.
train_loader = collect_t2kde_data(data_file,
                                  batch_size=batch_size,
                                  device=device,
                                  slice=train_events)

## Second slice of events, built without `device`.
EVE_data = collect_t2kde_data(data_file,
                              batch_size=batch_size,
                              slice=eve_events)

## A `train_data_eval` loader (same file, batch_size=batch_size, device=device,
## shuffle=False, optionally slice(None,18000)) used to be built here; it is disabled.

# Validation dataset. You can slice to reduce the size.
## mds no separate validation set yet,
## For iter12, change slice(18000,None) to slice(10000,None)
## First, we'll see if this changes the validation cost significantly
##  Second, we will see if this reduces the validation cost fluctuations
val_loader = collect_t2kde_data(data_file,
                                batch_size=batch_size,
                                slice=val_events)

Loading data...
pocaMx.shape =  (80000,)
nEvts =  80000
len(pocaMx[0]) =  199
len(pocaMx[1]) =  25
len(pocaMx[2]) =  369
len(pocaMx[3]) =  143
len(pocaMx[4]) =  160
majorAxis.shape =  (80000, 3)
minorAxis_1.shape =  (80000, 3)
minorAxis_2.shape =  (80000, 3)
have entered six_ellipsoid_parameters
  
 
  nEvts =  80000
 iEvt, nTrks =  0 199
 iEvt, nTrks =  1 25
 iEvt, nTrks =  2 369
 iEvt, nTrks =  3 143
 iEvt, nTrks =  4 160
 iEvt, nTrks =  5 260
 iEvt, nTrks =  6 237
 iEvt, nTrks =  7 327
 iEvt, nTrks =  8 178
 iEvt, nTrks =  9 106
A.shape =  (80000,)
majorAxis[iTrk][0][0] =  0.00045611936
majorAxis[iTrk][1][0] =  -4.8292455e-05
majorAxis[iTrk][2][0] =  0.090019904
minorAxis_1[iTrk][0][0] =  -1.8602173
minorAxis_1[iTrk][1][0] =  -17.569641
minorAxis_1[iTrk][2][0] =  4.7891795e-08
minorAxis_2[iTrk][0][0] =  -17.569414
minorAxis_2[iTrk][1][0] =  1.8601931
minorAxis_2[iTrk][2][0] =  0.0900199
  
majorAxis[iTrk][0][0] =  0.002360258
majorAxis[iTrk][1][0] =  -0.007426616
majorAxis[iTrk][2][

len(X) =  80000
len(Xlist) =  1
Loaded /share/lazy/will/data/June30_2020_80k_1.h5 in 171.8 s
outer loop X.shape =  (80000, 9, 600)
Constructing 20000 event dataset took 0.1339 s
x_t.shape =  torch.Size([20000, 9, 600])
x_t.shape[0] =  20000
x_t.shape[1] =  9
x_t.shape =  torch.Size([20000, 9, 600])
Loading data...
pocaMx.shape =  (80000,)
nEvts =  80000
len(pocaMx[0]) =  199
len(pocaMx[1]) =  25
len(pocaMx[2]) =  369
len(pocaMx[3]) =  143
len(pocaMx[4]) =  160
majorAxis.shape =  (80000, 3)
minorAxis_1.shape =  (80000, 3)
minorAxis_2.shape =  (80000, 3)
have entered six_ellipsoid_parameters
  
 
  nEvts =  80000
 iEvt, nTrks =  0 199
 iEvt, nTrks =  1 25
 iEvt, nTrks =  2 369
 iEvt, nTrks =  3 143
 iEvt, nTrks =  4 160
 iEvt, nTrks =  5 260
 iEvt, nTrks =  6 237
 iEvt, nTrks =  7 327
 iEvt, nTrks =  8 178
 iEvt, nTrks =  9 106
A.shape =  (80000,)
majorAxis[iTrk][0][0] =  0.00045611936
majorAxis[iTrk][1][0] =  -4.8292455e-05
majorAxis[iTrk][2][0] =  0.090019904
minorAxis_1[iTrk][0][0] = 

In [16]:
# Create the live training figure. `lines` is indexed with the keys 'train' and 'val'
# by the training loop, which also rescales `ax` after every epoch.
ax, tax, lax, lines = dual_train_plots()
# Keep a handle on the figure so the training loop can redraw it.
fig = ax.figure
plt.tight_layout()

<IPython.core.display.Javascript object>

In [17]:
# Train for n_epochs. trainNet yields one result per epoch; each result is recorded
# in `results`, the live plot is refreshed, and the model weights are written to
# `output`. epoch_start=len(results) continues the epoch numbering when the history
# already contains earlier epochs.
for result in trainNet(model, optimizer, loss,
                       train_loader, val_loader,
                       n_epochs, epoch_start=len(results),
                       notebook=True, step_schedule=step_schedule):

    # DataFrame.append was removed in pandas 2.0; pd.concat is the supported
    # replacement. The very first row replaces the empty frame outright so that no
    # empty frame is ever passed to concat.
    new_row = pd.DataFrame([result._asdict()])
    if results.empty:
        results = new_row
    else:
        results = pd.concat([results, new_row], ignore_index=True)
    xs = results.index

    # Update the plot above
    lines['train'].set_data(results.index,results.cost)
    lines['val'].set_data(results.index,results.val)

    # Filter out the first epoch's training cost (can be really large) once there is
    # more than one epoch; .iloc makes the positional slice explicit.
    costs_for_limit = results.cost if len(results.cost)<2 else results.cost.iloc[1:]
    max_cost = max(max(costs_for_limit), max(results.val))
    min_cost = min(min(results.cost), min(results.val))

    # The plot limits need updating too
    ax.set_ylim(min_cost*.9, max_cost*1.1)
    ax.set_xlim(-.5, len(results.cost) - .5)

    # Redraw the figure
    fig.canvas.draw()

    # Save each model state dictionary (one file per epoch)
    torch.save(model.state_dict(), output / f'{name}_{result.epoch}.pyt')
    #mine: snapshot of the parameters after this epoch
    param_states.append(get_param_state(model))

Number of batches: train = 2500, val = 1250


HBox(children=(FloatProgress(value=0.0, description='Epochs', layout=Layout(flex='2'), max=200.0, style=Progre…

Number of batches: train = 2500, val = 1250


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 0 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 0.0001
Epoch 0: train=11.7193, val=11.8728, took 128.87 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 1 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 0.0001
Epoch 1: train=11.766, val=11.8673, took 139.97 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 2 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 0.0001
Epoch 2: train=11.7782, val=11.8535, took 189.42 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 3 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 0.0001
Epoch 3: train=11.7614, val=11.8496, took 211.96 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 4 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 0.0001
Epoch 4: train=11.7615, val=11.8367, took 215.28 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 5 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 0.0001
Epoch 5: train=11.7521, val=11.8485, took 213.46 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 6 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 0.0001
Epoch 6: train=11.7653, val=11.8463, took 214.25 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 7 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 0.0001
Epoch 7: train=11.7544, val=11.8454, took 216.05 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 8 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 0.0001
Epoch 8: train=11.6418, val=11.8065, took 211.5 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 9 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 0.0001
Epoch 9: train=11.0016, val=11.5522, took 213.44 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 10 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 0.0001
Epoch 10: train=11.0161, val=11.1502, took 214.73 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 11 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 0.0001
Epoch 11: train=10.6831, val=10.9276, took 212.1 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 12 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 0.0001
Epoch 12: train=10.5069, val=11.3259, took 213.65 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 13 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 0.0001
Epoch 13: train=10.5518, val=11.7853, took 217.49 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 14 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 0.0001
Epoch 14: train=11.0667, val=11.2581, took 211.12 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 15 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 0.0001
Epoch 15: train=10.5556, val=10.6629, took 213.62 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 16 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 0.0001
Epoch 16: train=10.2232, val=10.4775, took 213.97 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 17 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 0.0001
Epoch 17: train=10.1174, val=10.6052, took 212.11 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 18 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-05
Epoch 18: train=9.89974, val=10.9979, took 211.82 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 19 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-05
Epoch 19: train=9.47713, val=9.13989, took 213.25 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 20 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-05
Epoch 20: train=9.31364, val=10.3218, took 213.71 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 21 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-05
Epoch 21: train=9.10284, val=8.7354, took 214.52 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 22 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-05
Epoch 22: train=9.12829, val=9.11811, took 229.72 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 23 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-05
Epoch 23: train=9.04451, val=12.7869, took 218.71 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 24 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-05
Epoch 24: train=8.94891, val=11.9669, took 212.4 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 25 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-05
Epoch 25: train=9.04473, val=13.2742, took 213.07 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 26 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-05
Epoch 26: train=8.9932, val=10.7328, took 211.48 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 27 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-05
Epoch 27: train=8.78268, val=9.61169, took 214.62 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 28 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-05
Epoch 28: train=8.72826, val=13.001, took 216.92 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 29 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-05
Epoch 29: train=8.85204, val=9.44294, took 212.69 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 30 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-05
Epoch 30: train=8.65966, val=11.8167, took 223.73 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 31 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-05
Epoch 31: train=9.42362, val=10.7493, took 214.81 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 32 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-05
Epoch 32: train=10.2106, val=11.229, took 217.95 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 33 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-05
Epoch 33: train=9.79094, val=9.51728, took 217.06 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 34 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-05
Epoch 34: train=9.45811, val=10.0429, took 215.91 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 35 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-05
Epoch 35: train=9.26812, val=8.70651, took 216.29 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 36 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-05
Epoch 36: train=9.18435, val=8.53346, took 216.7 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 37 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-05
Epoch 37: train=9.06121, val=13.5031, took 214.91 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 38 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-05
Epoch 38: train=9.33685, val=10.3046, took 218.13 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 39 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-05
Epoch 39: train=8.31466, val=8.83769, took 217.11 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 40 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-05
Epoch 40: train=8.08914, val=7.61315, took 214.52 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 41 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-05
Epoch 41: train=7.96901, val=10.0482, took 216.37 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 42 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-05
Epoch 42: train=7.91875, val=11.7369, took 218.95 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 43 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-05
Epoch 43: train=7.94501, val=9.9355, took 217.99 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 44 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-05
Epoch 44: train=7.82664, val=10.8029, took 218.85 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 45 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-05
Epoch 45: train=7.82906, val=10.1629, took 217.44 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 46 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-05
Epoch 46: train=7.74343, val=9.27199, took 213.36 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 47 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-05
Epoch 47: train=7.67649, val=7.41942, took 213.62 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 48 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-05
Epoch 48: train=7.66808, val=11.119, took 211.65 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 49 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-05
Epoch 49: train=7.65557, val=7.15383, took 212.16 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 50 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-05
Epoch 50: train=7.55157, val=7.60963, took 214.29 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 51 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-05
Epoch 51: train=7.58701, val=7.75392, took 215.39 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 52 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-05
Epoch 52: train=7.70325, val=11.24, took 213.0 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 53 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-05
Epoch 53: train=7.56261, val=7.15123, took 213.35 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 54 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-05
Epoch 54: train=7.41937, val=6.92987, took 212.74 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 55 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-05
Epoch 55: train=7.50555, val=10.7342, took 213.97 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 56 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-05
Epoch 56: train=7.50876, val=9.8196, took 215.41 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 57 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-05
Epoch 57: train=7.30842, val=7.26358, took 212.9 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 58 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-05
Epoch 58: train=7.59884, val=6.92956, took 214.33 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 59 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-05
Epoch 59: train=7.04809, val=8.17735, took 214.26 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 60 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-05
Epoch 60: train=6.91591, val=6.93676, took 212.7 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 61 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-05
Epoch 61: train=6.97457, val=6.7226, took 212.82 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 62 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-05
Epoch 62: train=6.87172, val=6.52449, took 218.62 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 63 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-05
Epoch 63: train=6.87915, val=8.28344, took 217.24 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 64 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-05
Epoch 64: train=6.81415, val=6.56198, took 219.94 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 65 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-05
Epoch 65: train=6.8477, val=7.09042, took 218.63 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 66 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-05
Epoch 66: train=6.81695, val=7.44343, took 217.45 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 67 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-05
Epoch 67: train=6.74453, val=6.51076, took 219.24 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 68 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-05
Epoch 68: train=6.79972, val=7.717, took 235.22 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 69 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-05
Epoch 69: train=6.7275, val=6.4961, took 235.88 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 70 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-05
Epoch 70: train=6.73699, val=6.31549, took 238.09 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 71 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-05
Epoch 71: train=6.6584, val=6.32687, took 225.33 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 72 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-05
Epoch 72: train=6.77431, val=7.88469, took 224.83 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 73 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-05
Epoch 73: train=6.61841, val=6.40769, took 215.45 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 74 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-05
Epoch 74: train=6.66196, val=8.63073, took 213.74 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 75 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-05
Epoch 75: train=6.66771, val=9.49827, took 212.66 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 76 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-05
Epoch 76: train=6.64065, val=8.00265, took 215.94 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 77 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-05
Epoch 77: train=6.70281, val=8.75787, took 213.0 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 78 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-05
Epoch 78: train=6.71187, val=9.37206, took 213.91 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 79 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-05
Epoch 79: train=6.28575, val=6.06119, took 214.13 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 80 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-05
Epoch 80: train=6.32133, val=6.92788, took 212.46 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 81 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-05
Epoch 81: train=6.28215, val=8.44576, took 215.25 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 82 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-05
Epoch 82: train=6.25876, val=7.58861, took 213.16 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 83 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-05
Epoch 83: train=6.25452, val=6.07248, took 212.42 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 84 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-05
Epoch 84: train=6.21944, val=8.69759, took 224.63 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 85 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-05
Epoch 85: train=6.26469, val=6.7756, took 222.83 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 86 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-05
Epoch 86: train=6.1939, val=7.70075, took 213.87 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 87 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-05
Epoch 87: train=6.18607, val=6.08625, took 213.38 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 88 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-05
Epoch 88: train=6.1472, val=6.14903, took 212.95 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 89 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-05
Epoch 89: train=6.19627, val=6.57146, took 214.31 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 90 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-05
Epoch 90: train=6.19159, val=8.07785, took 215.24 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 91 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-05
Epoch 91: train=6.16962, val=5.90636, took 213.85 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 92 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-05
Epoch 92: train=6.10544, val=7.23135, took 213.57 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 93 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-05
Epoch 93: train=6.1465, val=7.38743, took 213.83 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 94 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-05
Epoch 94: train=6.12531, val=8.11371, took 213.36 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 95 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-05
Epoch 95: train=6.09536, val=6.81685, took 216.07 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 96 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-05
Epoch 96: train=6.03211, val=5.83263, took 213.43 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 97 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-05
Epoch 97: train=6.10375, val=5.9442, took 212.42 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 98 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999993e-05
Epoch 98: train=6.09206, val=5.89009, took 214.33 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 99 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999993e-05
Epoch 99: train=5.86014, val=6.53657, took 213.96 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 100 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999993e-05
Epoch 100: train=5.8592, val=5.96054, took 213.15 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 101 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999993e-05
Epoch 101: train=5.85686, val=5.90277, took 213.29 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 102 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999993e-05
Epoch 102: train=5.90178, val=5.66025, took 212.72 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 103 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999993e-05
Epoch 103: train=5.83514, val=5.67849, took 213.08 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 104 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999993e-05
Epoch 104: train=5.83915, val=5.67977, took 217.09 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 105 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999993e-05
Epoch 105: train=5.80935, val=8.32602, took 211.62 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 106 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999993e-05
Epoch 106: train=5.79351, val=5.66987, took 214.14 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 107 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999993e-05
Epoch 107: train=5.78539, val=5.83554, took 215.36 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 108 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999993e-05
Epoch 108: train=5.78695, val=5.61635, took 213.03 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 109 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999993e-05
Epoch 109: train=5.7393, val=5.6109, took 218.86 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 110 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999993e-05
Epoch 110: train=5.75399, val=8.0408, took 221.52 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 111 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999993e-05
Epoch 111: train=5.7693, val=7.68413, took 220.7 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 112 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999993e-05
Epoch 112: train=5.77287, val=6.65607, took 220.75 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 113 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999993e-05
Epoch 113: train=5.75374, val=5.69253, took 219.21 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 114 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999993e-05
Epoch 114: train=5.7127, val=7.41935, took 217.5 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 115 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999993e-05
Epoch 115: train=5.67849, val=5.56743, took 219.65 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 116 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999993e-05
Epoch 116: train=5.74597, val=6.00237, took 218.05 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 117 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999993e-05
Epoch 117: train=5.70031, val=7.39319, took 220.5 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 118 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999996e-05
Epoch 118: train=5.69937, val=5.6098, took 219.55 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 119 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999996e-05
Epoch 119: train=5.5554, val=5.59085, took 217.15 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 120 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999996e-05
Epoch 120: train=5.57343, val=5.81769, took 217.82 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 121 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999996e-05
Epoch 121: train=5.56472, val=5.46403, took 219.4 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 122 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999996e-05
Epoch 122: train=5.55166, val=5.54729, took 216.26 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 123 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999996e-05
Epoch 123: train=5.53764, val=5.44907, took 217.61 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 124 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999996e-05
Epoch 124: train=5.5727, val=5.46422, took 214.98 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 125 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999996e-05
Epoch 125: train=5.53913, val=6.98262, took 212.96 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 126 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999996e-05
Epoch 126: train=5.53376, val=5.46859, took 213.09 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 127 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999996e-05
Epoch 127: train=5.54163, val=5.57853, took 215.57 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 128 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999996e-05
Epoch 128: train=5.51805, val=5.61459, took 212.99 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 129 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999996e-05
Epoch 129: train=5.49274, val=7.39378, took 214.72 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 130 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999996e-05
Epoch 130: train=5.50399, val=5.45712, took 214.86 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 131 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999996e-05
Epoch 131: train=5.50175, val=5.4116, took 212.97 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 132 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999996e-05
Epoch 132: train=5.52396, val=6.1476, took 213.7 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 133 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999996e-05
Epoch 133: train=5.49584, val=6.28804, took 213.9 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 134 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999996e-05
Epoch 134: train=5.50864, val=5.37453, took 213.43 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 135 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999996e-05
Epoch 135: train=5.46801, val=5.45824, took 213.6 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 136 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999996e-05
Epoch 136: train=5.44795, val=5.89878, took 213.83 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 137 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999996e-05
Epoch 137: train=5.4577, val=5.6089, took 225.31 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 138 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999996e-06
Epoch 138: train=5.46427, val=5.43033, took 216.19 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 139 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999996e-06
Epoch 139: train=5.37953, val=5.32227, took 210.79 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 140 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999996e-06
Epoch 140: train=5.35868, val=5.4709, took 210.08 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 141 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999996e-06
Epoch 141: train=5.36331, val=5.65573, took 211.69 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 142 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999996e-06
Epoch 142: train=5.38315, val=5.42907, took 211.67 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 143 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999996e-06
Epoch 143: train=5.36674, val=5.35716, took 211.85 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 144 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999996e-06
Epoch 144: train=5.36025, val=5.33528, took 211.25 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 145 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999996e-06
Epoch 145: train=5.35015, val=5.43968, took 212.57 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 146 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999996e-06
Epoch 146: train=5.33351, val=5.29168, took 211.23 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 147 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999996e-06
Epoch 147: train=5.35595, val=5.32234, took 210.81 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 148 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999996e-06
Epoch 148: train=5.33854, val=5.38886, took 213.1 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 149 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999996e-06
Epoch 149: train=5.3427, val=5.42333, took 211.8 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 150 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999996e-06
Epoch 150: train=5.33304, val=6.45549, took 212.55 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 151 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999996e-06
Epoch 151: train=5.33126, val=5.89323, took 211.73 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 152 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999996e-06
Epoch 152: train=5.30626, val=5.44043, took 210.9 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 153 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999996e-06
Epoch 153: train=5.32097, val=5.3518, took 212.66 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 154 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999996e-06
Epoch 154: train=5.29513, val=5.29141, took 214.87 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 155 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999996e-06
Epoch 155: train=5.31235, val=5.43813, took 210.33 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 156 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999996e-06
Epoch 156: train=5.29924, val=5.23449, took 211.49 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 157 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999996e-06
Epoch 157: train=5.2954, val=5.27703, took 212.37 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 158 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-06
Epoch 158: train=5.29862, val=5.24366, took 211.29 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 159 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-06
Epoch 159: train=5.24427, val=5.22083, took 211.91 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 160 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-06
Epoch 160: train=5.2363, val=5.22628, took 212.6 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 161 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-06
Epoch 161: train=5.23389, val=5.29906, took 210.04 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 162 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-06
Epoch 162: train=5.23805, val=5.20646, took 214.95 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 163 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-06
Epoch 163: train=5.21805, val=5.21868, took 212.08 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 164 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-06
Epoch 164: train=5.21645, val=5.19542, took 210.67 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 165 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-06
Epoch 165: train=5.23534, val=5.25407, took 213.57 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 166 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-06
Epoch 166: train=5.21945, val=5.21659, took 212.21 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 167 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-06
Epoch 167: train=5.22205, val=5.19984, took 211.61 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 168 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-06
Epoch 168: train=5.21758, val=5.20955, took 210.88 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 169 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-06
Epoch 169: train=5.20765, val=5.17835, took 212.65 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 170 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-06
Epoch 170: train=5.20533, val=5.21855, took 212.74 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 171 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-06
Epoch 171: train=5.20279, val=5.23976, took 213.23 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 172 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-06
Epoch 172: train=5.18997, val=5.24331, took 213.06 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 173 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-06
Epoch 173: train=5.19859, val=5.1834, took 210.24 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 174 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-06
Epoch 174: train=5.1818, val=5.16901, took 211.91 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 175 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-06
Epoch 175: train=5.19098, val=5.16472, took 212.72 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 176 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-06
Epoch 176: train=5.1853, val=5.30657, took 211.04 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 177 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-06
Epoch 177: train=5.18805, val=5.34107, took 211.61 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 178 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-06
Epoch 178: train=5.17967, val=5.1562, took 211.95 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 179 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-06
Epoch 179: train=5.14685, val=5.15839, took 211.3 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 180 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-06
Epoch 180: train=5.14325, val=5.18015, took 211.09 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 181 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-06
Epoch 181: train=5.13257, val=5.13611, took 212.28 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 182 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-06
Epoch 182: train=5.13353, val=5.14055, took 211.19 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 183 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-06
Epoch 183: train=5.13828, val=5.15939, took 212.17 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 184 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-06
Epoch 184: train=5.13185, val=5.19131, took 213.57 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 185 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-06
Epoch 185: train=5.12757, val=5.16608, took 210.45 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 186 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-06
Epoch 186: train=5.1287, val=5.14393, took 211.46 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 187 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-06
Epoch 187: train=5.12762, val=5.13191, took 213.4 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 188 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-06
Epoch 188: train=5.12714, val=5.13942, took 209.32 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 189 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-06
Epoch 189: train=5.11716, val=5.13599, took 211.54 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 190 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-06
Epoch 190: train=5.11853, val=5.12286, took 212.89 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 191 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-06
Epoch 191: train=5.11741, val=5.14212, took 210.26 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 192 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-06
Epoch 192: train=5.10761, val=5.25873, took 212.04 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 193 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-06
Epoch 193: train=5.10848, val=5.11666, took 212.37 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 194 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-06
Epoch 194: train=5.10491, val=5.11966, took 210.78 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 195 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-06
Epoch 195: train=5.11414, val=5.15256, took 213.59 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 196 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-06
Epoch 196: train=5.10082, val=5.16717, took 209.62 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 197 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-06
Epoch 197: train=5.1108, val=5.12843, took 211.02 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 198 | exponent is 10
lr factor is 0.7 ^ 10
final lr: 2.8247524899999986e-06
Epoch 198: train=5.09973, val=5.15792, took 211.81 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=2500.0, style=Pro…

lr inital: 0.0001
Epoch 199 | exponent is 10
lr factor is 0.7 ^ 10
final lr: 2.8247524899999986e-06
Epoch 199: train=5.07753, val=5.14395, took 212.28 s



Go ahead and save the final model (even though it was also saved above):

In [18]:
# Write the weights as they stand after the last epoch to
# `<output>/<name>_final.pyt`.
final_model_path = output / f'{name}_final.pyt'
torch.save(model.state_dict(), final_model_path)

Save the output results:

In [19]:
# Store the per-epoch statistics table in an HDF5 file under the key 'results'.
# `key` is passed by keyword: recent pandas releases deprecate positional
# arguments to `to_hdf` other than the path.
# NOTE(review): unlike the model and plot files, this is written relative to
# the current working directory rather than under `output` — confirm intended.
results.to_hdf(f'{name}_stats.hdf5', key='results')

Redraw the training/validation plot from the full results and save it to the output directory:

In [20]:
# Redraw the cost curves over all recorded epochs. The same (cost, val) pair
# is deliberately passed for both argument pairs of `dual_train_plots`.
train_cost, val_cost = results.cost, results.val
dual_train_plots(results.index, train_cost, val_cost, train_cost, val_cost)
plt.tight_layout()

# Save the figure next to the model files.
stats_plot_path = output / f'{name}_stats_a.png'
plt.savefig(str(stats_plot_path))

<IPython.core.display.Javascript object>

In [21]:
from functions.utils import state_dict_to_vector
def angle_between(a, b):
    """Return the angle (in radians) between the vectors ``a`` and ``b``.

    The angle is computed as ``arccos(a.b / (|a| |b|))``.

    Parameters
    ----------
    a, b : array-like
        Vectors of equal length.

    Returns
    -------
    float
        Angle in ``[0, pi]``, or NaN when either vector has zero length
        (the angle is undefined in that case).
    """
    denom = np.linalg.norm(a) * np.linalg.norm(b)
    if denom == 0:
        # Undefined angle; the unguarded expression also produced NaN here
        # (0/0), but only after emitting a runtime warning.
        return np.nan
    cos_angle = np.dot(a, b) / denom
    # Floating-point rounding can push the cosine marginally outside [-1, 1]
    # for (anti)parallel vectors, which would make arccos return NaN.
    return np.arccos(np.clip(cos_angle, -1.0, 1.0))

# For each block of `grid_size` consecutive epochs, build a symmetric matrix of
# pairwise angles between the parameter-space steps taken inside that block.
angle_grids = []
grid_size = 25
num_epochs = n_epochs
num_epochs2 = 0

# Block boundaries 0, grid_size, 2*grid_size, ...; neighbouring boundaries are
# paired into half-open epoch intervals [start, stop).
epoch_edges = np.arange(0, num_epochs + num_epochs2 + 1, grid_size)
ep_intervals = list(zip(epoch_edges[:-1], epoch_edges[1:]))

for interval in ep_intervals:

    # Collect the stored parameter vectors for the epochs of this block.
    these_param_states = []
    for i in range(interval[0], interval[1]):
        if i % 100 == 0:
            print(i)
        these_param_states.append(param_states[i])

    # A step is the difference between two consecutive parameter vectors, so a
    # block holding N states yields N-1 steps.
    interval_size = len(these_param_states) - 1
    these_steps = [
        later - earlier
        for earlier, later in zip(these_param_states[:-1], these_param_states[1:])
    ]

    # Only the upper triangle is computed; the value is mirrored into the lower
    # triangle and the diagonal is left at zero.
    this_angle_grid = np.zeros((interval_size, interval_size))
    for i in range(interval_size):
        for j in range(i + 1, interval_size):
            angle = angle_between(these_steps[i], these_steps[j])
            this_angle_grid[i, j] = angle
            this_angle_grid[j, i] = angle

    angle_grids.append(this_angle_grid)

0
100


In [22]:
import matplotlib.colors as colors
import matplotlib.cm as cm

# Draw one heat map per epoch block, each with its own colour scale.
for angle_grid in angle_grids:
    plt.figure(figsize=(12,8))
    # NaN-aware limits, so an undefined angle in the grid cannot turn the
    # whole colour scale into NaN.
    norm = colors.Normalize(vmin=np.nanmin(angle_grid), vmax=np.nanmax(angle_grid))
    # Attach the norm to the image and build the colorbar from that image, so
    # both share one scale. A detached ScalarMappable passed to plt.colorbar
    # without `ax` is deprecated and then rejected by recent matplotlib.
    image = plt.imshow(angle_grid, cmap=cm.jet, norm=norm)
    plt.colorbar(image)
    plt.xlabel('Step i')
    plt.ylabel('Step j')
    
#print("num params:", len(these_param_states[0]))

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

In [23]:
from functions.plotting_DDplus_hists import load_data
from functions.utils import vector_to_state_dict

# Rebuild a state dict from the stored parameter vector of every 10th epoch,
# keeping the epoch number alongside it as an (epoch, state_dict) pair.
state_dicts = [
    (epoch, vector_to_state_dict(param_states[epoch], model))
    for epoch in np.arange(0, num_epochs, 10)
]

# Load the dataset that the plotting cell consumes.
data = load_data()

Loading data...
pocaMx.shape =  (20000,)
nEvts =  20000
len(pocaMx[0]) =  211
len(pocaMx[1]) =  21
len(pocaMx[2]) =  20
len(pocaMx[3]) =  198
len(pocaMx[4]) =  233
majorAxis.shape =  (20000, 3)
minorAxis_1.shape =  (20000, 3)
minorAxis_2.shape =  (20000, 3)
have entered six_ellipsoid_parameters
  
 
  nEvts =  20000
 iEvt, nTrks =  0 211
 iEvt, nTrks =  1 21
 iEvt, nTrks =  2 20
 iEvt, nTrks =  3 198
 iEvt, nTrks =  4 233
 iEvt, nTrks =  5 85
 iEvt, nTrks =  6 223
 iEvt, nTrks =  7 425
 iEvt, nTrks =  8 252
 iEvt, nTrks =  9 169
A.shape =  (20000,)
majorAxis[iTrk][0][0] =  -0.00023452607
majorAxis[iTrk][1][0] =  -0.00047206535
majorAxis[iTrk][2][0] =  0.096502915
minorAxis_1[iTrk][0][0] =  -15.822749
minorAxis_1[iTrk][1][0] =  7.8608756
minorAxis_1[iTrk][2][0] =  -2.6228399e-08
minorAxis_2[iTrk][0][0] =  7.860759
minorAxis_2[iTrk][1][0] =  15.822513
minorAxis_2[iTrk][2][0] =  0.096502915
  
majorAxis[iTrk][0][0] =  -0.37655562
majorAxis[iTrk][1][0] =  0.2768704
majorAxis[iTrk][2][0] = 

In [24]:
# Import the plotting helper under the alias `Plot` and call it with the
# (epoch, state_dict) pairs and the dataset assigned in the previous cell.
# NOTE(review): presumably draws one set of histograms per saved epoch —
# confirm in functions.plotting_DDplus_hists.
from functions.plotting_DDplus_hists import plot_DDplus_hists as Plot
Plot(state_dicts, data)

[0, 10, 20, 30, 40, 50, 60, 70, 80, 90, 100, 110, 120, 130, 140, 150, 160, 170, 180, 190]


<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>