In [1]:
##%matplotlib widget
## with %matplotlib notebook: seems to require ipympl as part of the environment, either
## as part of the conda environment or via "pip install ipympl";
## otherwise, it does not show ANY plots in the notebook (plt.savefig() still works)
%matplotlib notebook  
##%matplotlib inline    ## --plt.savefig()  works, but re-sizing does NOT


This notebook is the second attempt to read in track information and use it to predict the KDE used as input to PvFinder. This time, we are reading in poca KDEs rather than the original KDEs. 

collectdata_kde_C.py uses poca_z, poca_x, poca_y, major_axis_x, major_axis_y, and major_axis_z as the six track parameters (for the moment)


Check the current GPU usage. Please try to be nice!

In [2]:
!nvidia-smi

Sun Aug 29 12:53:36 2021       
+-----------------------------------------------------------------------------+
| NVIDIA-SMI 470.42.01    Driver Version: 470.42.01    CUDA Version: 11.4     |
|-------------------------------+----------------------+----------------------+
| GPU  Name        Persistence-M| Bus-Id        Disp.A | Volatile Uncorr. ECC |
| Fan  Temp  Perf  Pwr:Usage/Cap|         Memory-Usage | GPU-Util  Compute M. |
|                               |                      |               MIG M. |
|   0  NVIDIA TITAN V      Off  | 00000000:03:00.0 Off |                  N/A |
| 28%   36C    P8    23W / 250W |   2632MiB / 12066MiB |      0%      Default |
|                               |                      |                  N/A |
+-------------------------------+----------------------+----------------------+
|   1  Tesla P100-PCIE...  Off  | 00000000:83:00.0 Off |                    0 |
| N/A   79C    P0   113W / 250W |   7774MiB / 16280MiB |     94%      Default |
|       

> **WARNING**: The card numbers here are *not* the same as in CUDA. You have been warned.

This notebook is the first attempt to read in track information and use it to predict the KDE used as input to PvFinder.


## Imports

In [3]:
import matplotlib.pyplot as plt
import numpy as np
import time
import torch
import pandas as pd

# Python 3 standard library
from pathlib import Path

##from torchsummary import summary

### Set up local parameters

In [4]:
# Number of training epochs for this iteration
n_epochs = 200

## History notes from earlier iterations:
##  201027 -- about to go to bed, so try 2500 epochs with lr = 1e55 (sic; presumably 1e-5)
##  previous iteration had lr = 3e-5 and the cost dropped almost linearly
##  for 100 epochs -- final training cost ~ 2.02, validation cost ~ 2.01
##
##  for iter 4, try 10 epochs with lr = 3e-6
##  usually have a big jump down at epoch 0; want to try a
##  small number of epochs per iteration and see what happens (iter4: 10 epochs gave
##  training cost dropping from 1.54 to 1.50 immediately, then dropping very slowly)

# "name" is the base name of the saved-model files; the output folder uses the same name
name = 'baileyds200ep_DDplus_iter5_lrstepschedulecontinued'

## Special instructions for those working on goofy at UC:
## please be very careful to make sure that your folder
## does not live in a subdirectory of your home directory;
## this disk has very little capacity. Instead, use
## a subdirectory in /share/lazy with a symbolic link to
## it in this (the notebooks) subdirectory
folder = 'baileyds/DDplus/' + name
# Output folder for this run (change if you want)
output = Path(folder)

# Size of batches
batch_size = 16  ## was 64
# How fast to learn
learning_rate = 1e-5

Make the output directory if it does not exist:

In [5]:
# `output` is a nested path (baileyds/DDplus/<name>), so create any missing
# parent directories too; without parents=True a fresh checkout raises
# FileNotFoundError. exist_ok=True keeps the cell safe to re-run.
output.mkdir(parents=True, exist_ok=True)

## Get the helper functions

Add the directory with the model
definitions to the path so we can import from it:

> When you type `import X`,
Python searches `sys.path` for a python
file named `X.py` to import. So we need to add the model directory to the path.

In [6]:
# Data loader
##from model.collectdata_kde_B import collect_t2kde_data
## collectdata_kde_C should use the new poca KDE rather than the original kernel KDE
from model.collectdata_kde_Ellipsoids import collect_t2kde_data


# Loss function
##from loss import Loss
## kde_loss_D includes both a ratio term and a chisq term, 98% ave_chisq
## kde_loss_E adds a chi^4 term to the kde_loss_D return value
## this is intended to emphasize the importance of values significantly different than zero
## NOTE(review): the notes above describe kde_loss_D/E, but kde_loss_Ba is what is imported
from model.kde_loss_Ba import Loss

##  TracksToKDE_Ellipsoids_SevenLayerCake has 7 hidden layers producing the 4000-bin KDE histogram
##  It takes 9 input features (poca centers + (A,B,C,D,E,F)).
## NOTE(review): the model actually imported below is TracksToKDE_Ellipsoids_DDplus;
## the SevenLayerCake description above looks stale -- confirm
from model.models_kde import TracksToKDE_Ellipsoids_DDplus as Model


# trainNet is taken from functions.my_training_kde only. It used to be imported
# from model.training_kde as well, but that binding was immediately shadowed by
# the import below, so the dead name has been dropped.
from model.training_kde import select_gpu, Results
from functions.my_training_kde import trainNet
from model.plots import dual_train_plots, replace_in_ax

In [7]:
# Helper that captures a snapshot of the model parameters (my addition)
from functions.utils import get_param_state

# Both containers are built up during the run - do not rerun this cell
# One row per epoch, with the columns given by the Results fields
results = pd.DataFrame(data=[], columns=Results._fields)
# One parameter snapshot per get_param_state(model) call
param_states = list()

Set up Torch device configuration. All tensors and model parameters need to know where to be put.
This takes a BUS ID number: The BUS ID is the same as the listing at the top of this script.

In [8]:
# Use the first CUDA device when one is available (alternatively: select_gpu(0)).
# Fall back to the CPU, and say so, instead of failing later at model.to(device)
# on a machine without a usable GPU.
if torch.cuda.is_available():
    device = "cuda:0"
else:
    print("CUDA is not available -- falling back to device = 'cpu'")
    device = "cpu"
##device = "cpu"

## Loading data

Load the dataset, split into parts, then move to device (see `collectdata.py` in the `../model` directory)

# Preparing the model

Prepare a model, use multiple GPUs if they are VISIBLE, and move the model to the device.

In [9]:
##print("Let's use", torch.cuda.device_count(), "GPUs!")
##if torch.cuda.device_count() > 1:
##    model = torch.nn.DataParallel(model)

In [10]:
## A note in the PyTorch docs at https://pytorch.org/docs/stable/optim.html says:
##
##   If you need to move a model to GPU via .cuda(), please do so before constructing
##   optimizers for it. Parameters of a model after .cuda() will be different objects
##   with those before the call.
##
##   In general, you should make sure that optimized parameters live in consistent
##   locations when optimizers are constructed and used.
##
## so the model is built here (although we are using model.to(device), not explicitly .cuda())

# All eleven nOut widths passed to the model are 50
nOut1 = nOut2 = nOut3 = nOut4 = nOut5 = nOut6 = 50
nOut7 = nOut8 = nOut9 = nOut10 = nOut11 = 50
latentChannels = 4
model = Model(
    nOut1, nOut2, nOut3, nOut4, nOut5, nOut6,
    nOut7, nOut8, nOut9, nOut10, nOut11,
    latentChannels,
)

##summary(model, input_size=(4, 4000))
##print(model.parameters)

## The loop below lets the user freeze some of the weights, e.g. those
## taken from an earlier model trained with the original target histograms.
## Presumably this leaves either the perturbative filter "fixed" and lets the
## learning focus on the non-perturbative features, so get started faster, or vice versa.
## With the threshold "ct < 0" no child is frozen.
ct = 0
for child in model.children():
    print('ct, child = ',ct, "  ", child)
    freeze_this_child = ct < 0
    if freeze_this_child:
        print("     About to set param.requires_grad=False for ct = ", ct, "params")
        for param in child.parameters():
            param.requires_grad = False
    ct += 1

##  mds 200121 loss = Loss(epsilon=1e-5,coefficient=1.0)
##  loss = Loss(epsilon=1e-5,coefficient=2.5)
##loss = Loss(epsilon=3e-5, debug=False)
loss = Loss(epsilon=3e-5)

ct, child =  0    Linear(in_features=9, out_features=50, bias=True)
ct, child =  1    Linear(in_features=50, out_features=50, bias=True)
ct, child =  2    Linear(in_features=50, out_features=50, bias=True)
ct, child =  3    Linear(in_features=50, out_features=50, bias=True)
ct, child =  4    Linear(in_features=50, out_features=50, bias=True)
ct, child =  5    Linear(in_features=50, out_features=50, bias=True)
ct, child =  6    Linear(in_features=50, out_features=50, bias=True)
ct, child =  7    Linear(in_features=50, out_features=50, bias=True)
ct, child =  8    Linear(in_features=50, out_features=50, bias=True)
ct, child =  9    Linear(in_features=50, out_features=50, bias=True)
ct, child =  10    Linear(in_features=50, out_features=50, bias=True)
ct, child =  11    Linear(in_features=50, out_features=16000, bias=True)
ct, child =  12    Conv1d(4, 25, kernel_size=(25,), stride=(1,), padding=(12,))
ct, child =  13    Conv1d(25, 1, kernel_size=(5,), stride=(1,), padding=(2,))
ct, child 

Let's move the model's weight matrices to the GPU:

In [11]:
# Move the model to the configured device; this is done before the optimizer
# is constructed in the next cell.
model = model.to(device)

In [12]:
from functions.my_optimizers import StepLrSchedule

# Adam over all model parameters, starting from the configured learning rate
##optimizer = torch.optim.SGD(model.parameters(), lr=learning_rate)
optimizer = torch.optim.Adam(params=model.parameters(), lr=learning_rate)

# Step schedule for the learning rate; the training log prints the factor as
# decay_rate ^ exponent (0.7 ^ 0, 0.7 ^ 1, ...).
# NOTE(review): with drop_rate=20 the logged exponent first changes at epoch 18,
# not 20 -- confirm the intended offset in StepLrSchedule.
step_schedule = StepLrSchedule(optimizer, decay_rate=0.7, drop_rate=20)

In [13]:
# Initialise the model weights for this iteration:
#   1. list the keys of the freshly constructed model's state dict,
#   2. shrink the hidden-layer biases of the fresh model,
#   3. load the weights saved at the end of the previous iteration,
#   4. record a snapshot of the resulting parameters.
print('output = ',output)
##print('oldOutput = ',oldOutput)

##   ML -> /share/lazy/sokoloff/ML
model_dict = model.state_dict()
## mds 190725 for debugging
print("for model_dict")
for index, k in enumerate(model_dict):
    print("index, k =  ",index,"  ",k)

## when starting "ab initio", reduce biases as the bias gets summed for each track
## contributing to the predicted KDE.
## NOTE: any of these biases that is also present in the checkpoint loaded below
## is overwritten by that load.
updated_dict = model_dict
for layer_number in range(1, 12):
    bias_key = f"layer{layer_number}.bias"
    updated_dict[bias_key] = 0.005*model_dict[bias_key]

model.load_state_dict(updated_dict,strict=False)
model_dict = model.state_dict()
##print("updated model_dict = ",model_dict)

## To use only some layers from a pre-existing model (e.g. one with a fully connected
## last layer rather than a convolutional layer), see the recipe at
## https://discuss.pytorch.org/t/how-to-load-part-of-pre-trained-model/1113 :
##   1. filter out unnecessary keys
##        pretrained_dict = {k: v for k, v in pretrained_dict.items() if k in model_dict}
##   2. overwrite entries in the existing state dict
##        model_dict.update(pretrained_dict)
##   3. load the new state dict with strict=False, as the two models' attributes
##      do not agree exactly; see
##      https://pytorch.org/docs/master/_modules/torch/nn/modules/module.html#Module.load_state_dict
## An earlier starting point was
## 'ML/29July2020_Trks_to_KDE_C_lossB_100epochs_b64_1m3_nOut_50x50/29July2020_Trks_to_KDE_C_lossB_100epochs_b64_1m3_nOut_50x50_final.pyt'

## previous iteration finished at training cost = 1.46, validation cost = 1.50
d_folder = 'baileyds200ep_DDplus_iter4_lrstepschedule'
d_name = d_folder
suffix = 'final'
dict_name = 'baileyds/DDplus/' + d_folder + '/' + d_name + '_'+ suffix + '.pyt'
print('dict_name = ',dict_name)
# map_location puts the checkpoint tensors on the device used in this session,
# whichever device they were saved from.
pretrained_dict = torch.load(dict_name, map_location=device)

# strict=False tolerates key mismatches, so report them instead of silently
# continuing with partially loaded weights.
load_report = model.load_state_dict(pretrained_dict,strict=False)
if load_report.missing_keys:
    print('keys missing from pretrained_dict = ',load_report.missing_keys)
if load_report.unexpected_keys:
    print('unexpected keys in pretrained_dict = ',load_report.unexpected_keys)

#mine: snapshot of the parameters before any training in this session
param_states.append(get_param_state(model))


output =  baileyds/DDplus/baileyds200ep_DDplus_iter5_lrstepschedulecontinued
for model_dict
index, k =   0    layer1.weight
index, k =   1    layer1.bias
index, k =   2    layer2.weight
index, k =   3    layer2.bias
index, k =   4    layer3.weight
index, k =   5    layer3.bias
index, k =   6    layer4.weight
index, k =   7    layer4.bias
index, k =   8    layer5.weight
index, k =   9    layer5.bias
index, k =   10    layer6.weight
index, k =   11    layer6.bias
index, k =   12    layer7.weight
index, k =   13    layer7.bias
index, k =   14    layer8.weight
index, k =   15    layer8.bias
index, k =   16    layer9.weight
index, k =   17    layer9.bias
index, k =   18    layer10.weight
index, k =   19    layer10.bias
index, k =   20    layer11.weight
index, k =   21    layer11.bias
index, k =   22    layer12new.weight
index, k =   23    layer12new.bias
index, k =   24    conv1.weight
index, k =   25    conv1.bias
index, k =   26    conv2.weight
index, k =   27    conv2.bias
index, k =   2

In [14]:
##print('validation.dataset.tensors = ',validation.dataset.tensors)
# Default figure size for the plots below: width 10, height 4
fig_size = [10, 4]
plt.rcParams["figure.figsize"] = fig_size

In [15]:

## Input file shared by the training and validation loaders.
## Files used previously:
##   '/share/lazy/pv-finder/20k_evts_for_KDE_learning_200716.h5'
##   '/share/lazy/pv-finder/test_data_for_KDE_learning_BastilleDay20.h5'
kde_events_file = 'dataAA/20K_POCA_kernel_evts_200926.h5'

## Note on the (currently disabled) device=device argument:
## if we are using a larger dataset (240K events, with the datasets above, and 11 GB of GPU memory),
## the dataset will overflow the GPU memory; device=device will allow the data to move back
## and forth between the CPU and GPU memory. While this allows use of a larger dataset, it slows
## down performance by about 10%.  So leave it commented out when not needed.

## Training dataset. You can put as many files here as desired.
train_loader = collect_t2kde_data(
    kde_events_file,
    batch_size=batch_size,
    ##device=device,
    slice=slice(None, 18000),
)

# Validation dataset. You can slice to reduce the size.
## mds no separate validation set yet, so use the events from 18000 onwards of the same file
val_loader = collect_t2kde_data(
    kde_events_file,
    batch_size=batch_size,
    ##device=device,
    slice=slice(18000, None),
)


Loading data...
pocaMx.shape =  (20000,)
nEvts =  20000
len(pocaMx[0]) =  211
len(pocaMx[1]) =  21
len(pocaMx[2]) =  20
len(pocaMx[3]) =  198
len(pocaMx[4]) =  233
majorAxis.shape =  (20000, 3)
minorAxis_1.shape =  (20000, 3)
minorAxis_2.shape =  (20000, 3)
have entered six_ellipsoid_parameters
  
 
  nEvts =  20000
 iEvt, nTrks =  0 211
 iEvt, nTrks =  1 21
 iEvt, nTrks =  2 20
 iEvt, nTrks =  3 198
 iEvt, nTrks =  4 233
 iEvt, nTrks =  5 85
 iEvt, nTrks =  6 223
 iEvt, nTrks =  7 425
 iEvt, nTrks =  8 252
 iEvt, nTrks =  9 169
A.shape =  (20000,)
majorAxis[iTrk][0][0] =  -0.00023452607
majorAxis[iTrk][1][0] =  -0.00047206535
majorAxis[iTrk][2][0] =  0.096502915
minorAxis_1[iTrk][0][0] =  -15.822749
minorAxis_1[iTrk][1][0] =  7.8608756
minorAxis_1[iTrk][2][0] =  -2.6228399e-08
minorAxis_2[iTrk][0][0] =  7.860759
minorAxis_2[iTrk][1][0] =  15.822513
minorAxis_2[iTrk][2][0] =  0.096502915
  
majorAxis[iTrk][0][0] =  -0.37655562
majorAxis[iTrk][1][0] =  0.2768704
majorAxis[iTrk][2][0] = 

len(X) =  20000
len(Xlist) =  1
Loaded dataAA/20K_POCA_kernel_evts_200926.h5 in 42.14 s
outer loop X.shape =  (20000, 9, 600)
Constructing 2000 event dataset took 0.0204 s
x_t.shape =  torch.Size([2000, 9, 600])
x_t.shape[0] =  2000
x_t.shape[1] =  9
x_t.shape =  torch.Size([2000, 9, 600])


In [16]:
# Build the live training plot. `lines` is indexed by 'train' and 'val' in the
# training loop, and `ax` is the axis whose limits that loop rescales.
ax, tax, lax, lines = dual_train_plots()
# Keep a handle on the figure so the training loop can redraw it
fig = ax.figure
plt.tight_layout()

<IPython.core.display.Javascript object>

In [17]:
# Run the training generator. Each yielded `result` is appended to `results`,
# the live plot is refreshed, and the model weights plus a parameter snapshot
# are saved.
for result in trainNet(model, optimizer, loss,
                        train_loader, val_loader,
                        n_epochs, epoch_start=len(results),
                        notebook=True, step_schedule=step_schedule):

    # DataFrame.append was removed in pandas 2.0; pd.concat is the replacement.
    # On the first pass `results` is empty, so start from the new row directly
    # (this also avoids concatenating an empty, all-object frame).
    new_row = pd.DataFrame([result._asdict()])
    if results.empty:
        results = new_row
    else:
        results = pd.concat([results, new_row], ignore_index=True)
    xs = results.index

    # Update the plot above
    lines['train'].set_data(xs, results.cost)
    lines['val'].set_data(xs, results.val)

    # Filter out the first training cost (can be really large) once there is
    # more than one entry, so it does not dominate the y-axis range
    train_costs_for_max = results.cost if len(results.cost) < 2 else results.cost.iloc[1:]
    max_cost = max(max(train_costs_for_max), max(results.val))
    min_cost = min(min(results.cost), min(results.val))

    # The plot limits need updating too
    ax.set_ylim(min_cost*.9, max_cost*1.1)
    ax.set_xlim(-.5, len(results.cost) - .5)

    # Redraw the figure
    fig.canvas.draw()

    # Save each model state dictionary
    torch.save(model.state_dict(), output / f'{name}_{result.epoch}.pyt')
    #mine: record the parameter state after this result
    param_states.append(get_param_state(model))

Number of batches: train = 1125, val = 125


HBox(children=(FloatProgress(value=0.0, description='Epochs', layout=Layout(flex='2'), max=200.0, style=Progre…

Number of batches: train = 1125, val = 125


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 0 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 1e-05
Epoch 0: train=6.87898, val=7.20091, took 39.928 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 1 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 1e-05
Epoch 1: train=6.83797, val=7.43239, took 38.958 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 2 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 1e-05
Epoch 2: train=6.83958, val=7.71697, took 39.036 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 3 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 1e-05
Epoch 3: train=6.85885, val=7.30058, took 39.275 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 4 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 1e-05
Epoch 4: train=6.80895, val=7.39685, took 39.033 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 5 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 1e-05
Epoch 5: train=6.81592, val=6.9909, took 39.42 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 6 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 1e-05
Epoch 6: train=6.80833, val=7.07252, took 38.917 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 7 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 1e-05
Epoch 7: train=6.81761, val=7.32734, took 38.946 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 8 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 1e-05
Epoch 8: train=6.78563, val=6.91173, took 39.178 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 9 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 1e-05
Epoch 9: train=6.78521, val=7.36473, took 39.439 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 10 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 1e-05
Epoch 10: train=6.7822, val=6.99233, took 39.022 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 11 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 1e-05
Epoch 11: train=6.78814, val=7.03767, took 38.936 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 12 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 1e-05
Epoch 12: train=6.77445, val=6.89652, took 39.405 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 13 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 1e-05
Epoch 13: train=6.78028, val=6.88816, took 38.995 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 14 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 1e-05
Epoch 14: train=6.78537, val=7.29101, took 39.024 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 15 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 1e-05
Epoch 15: train=6.73794, val=7.56538, took 38.626 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 16 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 1e-05
Epoch 16: train=6.73952, val=6.93027, took 45.909 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 17 | exponent is 0
lr factor is 0.7 ^ 0
final lr: 1e-05
Epoch 17: train=6.72506, val=7.03967, took 46.971 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 18 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-06
Epoch 18: train=6.7218, val=6.86578, took 47.736 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 19 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-06
Epoch 19: train=6.64832, val=6.86346, took 50.699 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 20 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-06
Epoch 20: train=6.66463, val=6.91792, took 51.666 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 21 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-06
Epoch 21: train=6.67223, val=6.94026, took 52.045 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 22 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-06
Epoch 22: train=6.64021, val=6.83717, took 52.346 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 23 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-06
Epoch 23: train=6.64613, val=6.91618, took 51.688 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 24 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-06
Epoch 24: train=6.65958, val=6.85203, took 45.67 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 25 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-06
Epoch 25: train=6.6506, val=6.83212, took 42.978 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 26 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-06
Epoch 26: train=6.63067, val=6.87482, took 43.25 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 27 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-06
Epoch 27: train=6.63102, val=6.83083, took 42.582 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 28 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-06
Epoch 28: train=6.63626, val=6.87893, took 43.218 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 29 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-06
Epoch 29: train=6.61543, val=6.9634, took 43.279 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 30 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-06
Epoch 30: train=6.60604, val=6.89479, took 43.33 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 31 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-06
Epoch 31: train=6.59996, val=7.01412, took 41.937 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 32 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-06
Epoch 32: train=6.61272, val=6.79213, took 39.726 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 33 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-06
Epoch 33: train=6.59015, val=6.8072, took 38.807 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 34 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-06
Epoch 34: train=6.58435, val=6.78533, took 38.744 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 35 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-06
Epoch 35: train=6.60302, val=6.78759, took 38.796 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 36 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-06
Epoch 36: train=6.5992, val=6.78587, took 38.501 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 37 | exponent is 1
lr factor is 0.7 ^ 1
final lr: 7e-06
Epoch 37: train=6.58807, val=6.786, took 38.716 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 38 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-06
Epoch 38: train=6.57643, val=6.78546, took 39.327 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 39 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-06
Epoch 39: train=6.54185, val=6.76958, took 39.336 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 40 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-06
Epoch 40: train=6.54449, val=6.78648, took 39.186 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 41 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-06
Epoch 41: train=6.54259, val=6.93038, took 38.95 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 42 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-06
Epoch 42: train=6.52798, val=6.77189, took 39.119 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 43 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-06
Epoch 43: train=6.52203, val=6.76151, took 39.229 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 44 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-06
Epoch 44: train=6.52237, val=6.76755, took 38.822 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 45 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-06
Epoch 45: train=6.52216, val=6.78633, took 39.372 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 46 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-06
Epoch 46: train=6.51608, val=6.75367, took 39.449 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 47 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-06
Epoch 47: train=6.50529, val=6.75778, took 39.511 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 48 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-06
Epoch 48: train=6.50371, val=6.78791, took 38.913 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 49 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-06
Epoch 49: train=6.50723, val=6.83992, took 39.33 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 50 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-06
Epoch 50: train=6.49915, val=6.76069, took 39.723 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 51 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-06
Epoch 51: train=6.49879, val=6.74949, took 39.359 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 52 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-06
Epoch 52: train=6.49692, val=6.74426, took 38.846 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 53 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-06
Epoch 53: train=6.48423, val=6.81189, took 38.882 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 54 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-06
Epoch 54: train=6.4903, val=6.74257, took 38.731 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 55 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-06
Epoch 55: train=6.48261, val=6.76434, took 38.435 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 56 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-06
Epoch 56: train=6.48546, val=6.7294, took 38.83 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 57 | exponent is 2
lr factor is 0.7 ^ 2
final lr: 4.9e-06
Epoch 57: train=6.47988, val=6.72949, took 38.768 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 58 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-06
Epoch 58: train=6.48268, val=6.74806, took 39.146 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 59 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-06
Epoch 59: train=6.4424, val=6.85979, took 39.35 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 60 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-06
Epoch 60: train=6.43739, val=6.72239, took 39.213 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 61 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-06
Epoch 61: train=6.44026, val=6.72231, took 39.399 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 62 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-06
Epoch 62: train=6.4417, val=6.70807, took 39.444 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 63 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-06
Epoch 63: train=6.4493, val=6.73405, took 39.365 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 64 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-06
Epoch 64: train=6.43545, val=6.71293, took 39.34 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 65 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-06
Epoch 65: train=6.43922, val=6.71713, took 39.134 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 66 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-06
Epoch 66: train=6.43409, val=6.70355, took 39.368 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 67 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-06
Epoch 67: train=6.42471, val=6.70512, took 39.066 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 68 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-06
Epoch 68: train=6.42511, val=6.73015, took 38.955 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 69 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-06
Epoch 69: train=6.4258, val=6.69578, took 39.239 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 70 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-06
Epoch 70: train=6.41667, val=6.71154, took 39.006 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 71 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-06
Epoch 71: train=6.41484, val=6.69629, took 39.545 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 72 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-06
Epoch 72: train=6.41868, val=6.73524, took 39.093 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 73 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-06
Epoch 73: train=6.41009, val=6.73299, took 38.896 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 74 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-06
Epoch 74: train=6.40927, val=6.69922, took 38.635 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 75 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-06
Epoch 75: train=6.40521, val=6.69275, took 38.896 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 76 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-06
Epoch 76: train=6.4046, val=6.68324, took 38.957 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 77 | exponent is 3
lr factor is 0.7 ^ 3
final lr: 3.4299999999999993e-06
Epoch 77: train=6.40851, val=6.68992, took 38.871 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 78 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-06
Epoch 78: train=6.4, val=6.68079, took 39.532 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 79 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-06
Epoch 79: train=6.38312, val=6.67434, took 39.201 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 80 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-06
Epoch 80: train=6.37563, val=6.67555, took 39.641 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 81 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-06
Epoch 81: train=6.37666, val=6.67785, took 39.189 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 82 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-06
Epoch 82: train=6.37872, val=6.67802, took 39.134 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 83 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-06
Epoch 83: train=6.37581, val=6.70318, took 39.355 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 84 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-06
Epoch 84: train=6.3738, val=6.66802, took 38.885 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 85 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-06
Epoch 85: train=6.36861, val=6.67042, took 39.663 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 86 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-06
Epoch 86: train=6.36683, val=6.6682, took 39.324 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 87 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-06
Epoch 87: train=6.36662, val=6.67289, took 39.364 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 88 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-06
Epoch 88: train=6.36138, val=6.66915, took 39.41 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 89 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-06
Epoch 89: train=6.35969, val=6.6664, took 39.116 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 90 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-06
Epoch 90: train=6.36204, val=6.69983, took 39.436 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 91 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-06
Epoch 91: train=6.36174, val=6.67697, took 39.38 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 92 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-06
Epoch 92: train=6.35973, val=6.67056, took 39.269 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 93 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-06
Epoch 93: train=6.35261, val=6.67597, took 38.877 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 94 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-06
Epoch 94: train=6.36043, val=6.67892, took 38.842 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 95 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-06
Epoch 95: train=6.3469, val=6.66936, took 39.181 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 96 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-06
Epoch 96: train=6.34815, val=6.7273, took 38.862 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 97 | exponent is 4
lr factor is 0.7 ^ 4
final lr: 2.4009999999999995e-06
Epoch 97: train=6.34945, val=6.6544, took 38.906 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 98 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999996e-06
Epoch 98: train=6.3451, val=6.65497, took 39.353 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 99 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999996e-06
Epoch 99: train=6.33892, val=6.64385, took 39.759 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 100 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999996e-06
Epoch 100: train=6.33286, val=6.64288, took 39.119 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 101 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999996e-06
Epoch 101: train=6.33204, val=6.66023, took 39.33 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 102 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999996e-06
Epoch 102: train=6.33319, val=6.64411, took 39.437 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 103 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999996e-06
Epoch 103: train=6.3337, val=6.69641, took 39.186 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 104 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999996e-06
Epoch 104: train=6.32963, val=6.64152, took 39.303 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 105 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999996e-06
Epoch 105: train=6.33139, val=6.63526, took 39.306 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 106 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999996e-06
Epoch 106: train=6.32741, val=6.65674, took 39.3 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 107 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999996e-06
Epoch 107: train=6.32274, val=6.63478, took 39.568 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 108 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999996e-06
Epoch 108: train=6.32729, val=6.6427, took 39.18 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 109 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999996e-06
Epoch 109: train=6.32508, val=6.65509, took 39.575 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 110 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999996e-06
Epoch 110: train=6.32237, val=6.64217, took 39.012 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 111 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999996e-06
Epoch 111: train=6.32097, val=6.65718, took 39.653 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 112 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999996e-06
Epoch 112: train=6.31649, val=6.64835, took 39.049 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 113 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999996e-06
Epoch 113: train=6.31716, val=6.63048, took 38.732 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 114 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999996e-06
Epoch 114: train=6.31471, val=6.65604, took 38.6 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 115 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999996e-06
Epoch 115: train=6.3147, val=6.62638, took 38.739 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 116 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999996e-06
Epoch 116: train=6.32122, val=6.64102, took 38.871 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 117 | exponent is 5
lr factor is 0.7 ^ 5
final lr: 1.6806999999999996e-06
Epoch 117: train=6.31862, val=6.64179, took 38.912 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 118 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999998e-06
Epoch 118: train=6.30962, val=6.64501, took 39.531 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 119 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999998e-06
Epoch 119: train=6.30093, val=6.63839, took 38.96 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 120 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999998e-06
Epoch 120: train=6.3019, val=6.6259, took 39.454 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 121 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999998e-06
Epoch 121: train=6.30163, val=6.62426, took 39.443 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 122 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999998e-06
Epoch 122: train=6.30783, val=6.63557, took 39.617 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 123 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999998e-06
Epoch 123: train=6.2987, val=6.6391, took 39.641 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 124 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999998e-06
Epoch 124: train=6.29806, val=6.62185, took 39.084 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 125 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999998e-06
Epoch 125: train=6.30305, val=6.6202, took 39.696 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 126 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999998e-06
Epoch 126: train=6.29747, val=6.61672, took 39.339 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 127 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999998e-06
Epoch 127: train=6.29475, val=6.61847, took 40.436 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 128 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999998e-06
Epoch 128: train=6.30425, val=6.61606, took 39.729 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 129 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999998e-06
Epoch 129: train=6.29355, val=6.61504, took 39.137 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 130 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999998e-06
Epoch 130: train=6.29702, val=6.6188, took 39.41 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 131 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999998e-06
Epoch 131: train=6.29423, val=6.6171, took 39.431 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 132 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999998e-06
Epoch 132: train=6.29084, val=6.62345, took 39.309 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 133 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999998e-06
Epoch 133: train=6.28915, val=6.61199, took 38.42 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 134 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999998e-06
Epoch 134: train=6.29288, val=6.61533, took 38.589 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 135 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999998e-06
Epoch 135: train=6.2878, val=6.61568, took 38.667 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 136 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999998e-06
Epoch 136: train=6.29345, val=6.61009, took 38.538 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 137 | exponent is 6
lr factor is 0.7 ^ 6
final lr: 1.1764899999999998e-06
Epoch 137: train=6.29119, val=6.60976, took 38.885 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 138 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999997e-07
Epoch 138: train=6.28827, val=6.61938, took 39.389 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 139 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999997e-07
Epoch 139: train=6.28312, val=6.60884, took 39.422 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 140 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999997e-07
Epoch 140: train=6.284, val=6.61437, took 51.705 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 141 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999997e-07
Epoch 141: train=6.27983, val=6.60721, took 54.253 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 142 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999997e-07
Epoch 142: train=6.27618, val=6.60571, took 54.377 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 143 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999997e-07
Epoch 143: train=6.2787, val=6.61695, took 45.498 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 144 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999997e-07
Epoch 144: train=6.28328, val=6.61683, took 39.5 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 145 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999997e-07
Epoch 145: train=6.28199, val=6.60387, took 40.865 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 146 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999997e-07
Epoch 146: train=6.27205, val=6.60461, took 39.791 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 147 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999997e-07
Epoch 147: train=6.27537, val=6.60274, took 39.818 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 148 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999997e-07
Epoch 148: train=6.27558, val=6.61186, took 53.786 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 149 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999997e-07
Epoch 149: train=6.27519, val=6.6116, took 54.21 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 150 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999997e-07
Epoch 150: train=6.27929, val=6.60385, took 54.182 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 151 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999997e-07
Epoch 151: train=6.27792, val=6.6026, took 56.907 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 152 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999997e-07
Epoch 152: train=6.27231, val=6.60256, took 59.75 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 153 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999997e-07
Epoch 153: train=6.27129, val=6.60233, took 60.132 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 154 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999997e-07
Epoch 154: train=6.27137, val=6.60767, took 58.149 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 155 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999997e-07
Epoch 155: train=6.26728, val=6.6023, took 59.415 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 156 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999997e-07
Epoch 156: train=6.27206, val=6.59992, took 58.313 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 157 | exponent is 7
lr factor is 0.7 ^ 7
final lr: 8.235429999999997e-07
Epoch 157: train=6.26796, val=6.61682, took 56.637 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 158 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-07
Epoch 158: train=6.27018, val=6.61448, took 59.022 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 159 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-07
Epoch 159: train=6.26152, val=6.60454, took 58.746 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 160 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-07
Epoch 160: train=6.26512, val=6.59771, took 56.348 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 161 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-07
Epoch 161: train=6.26433, val=6.60851, took 54.497 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 162 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-07
Epoch 162: train=6.2611, val=6.59694, took 54.521 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 163 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-07
Epoch 163: train=6.26543, val=6.5957, took 53.083 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 164 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-07
Epoch 164: train=6.26353, val=6.60236, took 54.601 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 165 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-07
Epoch 165: train=6.26036, val=6.59744, took 54.292 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 166 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-07
Epoch 166: train=6.26106, val=6.59763, took 53.104 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 167 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-07
Epoch 167: train=6.26175, val=6.59769, took 54.381 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 168 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-07
Epoch 168: train=6.25924, val=6.59835, took 54.555 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 169 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-07
Epoch 169: train=6.25882, val=6.59671, took 52.97 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 170 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-07
Epoch 170: train=6.26134, val=6.60727, took 54.495 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 171 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-07
Epoch 171: train=6.25908, val=6.60669, took 54.482 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 172 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-07
Epoch 172: train=6.25657, val=6.60832, took 54.15 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 173 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-07
Epoch 173: train=6.25642, val=6.59535, took 54.174 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 174 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-07
Epoch 174: train=6.25625, val=6.59588, took 54.228 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 175 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-07
Epoch 175: train=6.25389, val=6.59322, took 54.249 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 176 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-07
Epoch 176: train=6.25621, val=6.60622, took 53.575 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 177 | exponent is 8
lr factor is 0.7 ^ 8
final lr: 5.764800999999997e-07
Epoch 177: train=6.26049, val=6.59404, took 54.552 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 178 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-07
Epoch 178: train=6.25622, val=6.60321, took 54.17 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 179 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-07
Epoch 179: train=6.25442, val=6.59102, took 52.677 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 180 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-07
Epoch 180: train=6.24894, val=6.58979, took 54.197 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 181 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-07
Epoch 181: train=6.25219, val=6.59221, took 54.673 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 182 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-07
Epoch 182: train=6.25283, val=6.58989, took 53.147 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 183 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-07
Epoch 183: train=6.25123, val=6.59022, took 54.74 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 184 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-07
Epoch 184: train=6.24938, val=6.59013, took 54.226 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 185 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-07
Epoch 185: train=6.24827, val=6.58917, took 52.916 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 186 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-07
Epoch 186: train=6.25206, val=6.59254, took 54.632 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 187 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-07
Epoch 187: train=6.24926, val=6.58777, took 54.568 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 188 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-07
Epoch 188: train=6.25045, val=6.59737, took 55.343 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 189 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-07
Epoch 189: train=6.25217, val=6.59991, took 54.808 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 190 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-07
Epoch 190: train=6.24338, val=6.58874, took 58.337 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 191 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-07
Epoch 191: train=6.25647, val=6.59195, took 66.529 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 192 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-07
Epoch 192: train=6.25027, val=6.59666, took 66.4 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 193 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-07
Epoch 193: train=6.24832, val=6.58854, took 68.683 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 194 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-07
Epoch 194: train=6.24763, val=6.58674, took 68.685 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 195 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-07
Epoch 195: train=6.24659, val=6.58687, took 68.417 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 196 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-07
Epoch 196: train=6.24752, val=6.58772, took 67.299 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 197 | exponent is 9
lr factor is 0.7 ^ 9
final lr: 4.035360699999998e-07
Epoch 197: train=6.24441, val=6.59482, took 58.012 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 198 | exponent is 10
lr factor is 0.7 ^ 10
final lr: 2.8247524899999984e-07
Epoch 198: train=6.25003, val=6.58689, took 58.915 s


HBox(children=(FloatProgress(value=0.0, description='Training', layout=Layout(flex='2'), max=1125.0, style=Pro…

lr inital: 1e-05
Epoch 199 | exponent is 10
lr factor is 0.7 ^ 10
final lr: 2.8247524899999984e-07
Epoch 199: train=6.24276, val=6.59251, took 58.575 s



Go ahead and save the final model (even though it was also saved above):

In [18]:
# Serialize the model's current parameters (its state_dict, not the whole
# module) to '<name>_final.pyt'.
# NOTE(review): `output` is presumably a pathlib.Path directory defined earlier
# in the notebook (it is combined with `/`) -- confirm.
torch.save(model.state_dict(), output / f'{name}_final.pyt')

Save the per-epoch training statistics (the `results` table) to an HDF5 file:

In [19]:
# Persist the per-epoch statistics table under the HDF5 key 'results'.
# `key` is passed by keyword: pandas 2.1+ deprecates positional arguments to
# `to_hdf` other than the path, and later releases make them keyword-only.
# NOTE(review): this writes to the current working directory, whereas the model
# and the plot in this notebook are saved under `output` -- confirm intended.
results.to_hdf(f'{name}_stats.hdf5', key='results')

Re-draw the training/validation loss plot and save it to a PNG file:

In [20]:
# Re-draw the training curves against the epoch index and write them to disk.
# NOTE(review): the same cost/val series are passed for both pairs of data
# arguments; `dual_train_plots` is defined outside this chunk, so what each
# pair is drawn as cannot be confirmed here.
dual_train_plots(results.index,
                 results.cost, results.val,
                 results.cost, results.val)
# Tighten subplot spacing before saving.
plt.tight_layout()
# Saved as '<name>_stats_a.png' next to the model file; the path is converted
# to str before being handed to savefig.
plt.savefig(str(output / f'{name}_stats_a.png'))

<IPython.core.display.Javascript object>

In [21]:
from functions.utils import state_dict_to_vector
def angle_between(a, b):
    """Return the angle, in radians, between the vectors ``a`` and ``b``.

    The angle is computed as ``arccos(a.b / (|a| |b|))`` and lies in [0, pi].

    Floating-point rounding can push the cosine marginally outside [-1, 1]
    when the vectors are (anti)parallel, which would make ``np.arccos`` return
    NaN; the cosine is therefore clipped to that interval first.

    A zero-length input still produces NaN (0/0), exactly as before.
    """
    cosine = np.dot(a, b) / (np.linalg.norm(a) * np.linalg.norm(b))
    return np.arccos(np.clip(cosine, -1.0, 1.0))

# Pairwise-angle analysis of consecutive optimisation steps.
# Epochs are grouped into windows of `grid_size`; for each window one symmetric
# matrix of angles between the per-epoch parameter updates is stored.
angle_grids = []
grid_size = 25
num_epochs = n_epochs
num_epochs2 = 0  # added to num_epochs when building the windows; zero here

# Window edges 0, grid_size, 2*grid_size, ...; neighbouring edges form the
# half-open epoch windows [start, stop).
interval_edges = np.arange(0, num_epochs + num_epochs2 + 1, grid_size)
ep_intervals = list(zip(interval_edges[:-1], interval_edges[1:]))

for interval in ep_intervals:
    first_epoch, stop_epoch = interval

    # Collect the parameter vectors of this window, echoing every 100th epoch
    # index as a coarse progress marker.
    these_param_states = []
    for epoch in range(first_epoch, stop_epoch):
        if epoch % 100 == 0:
            print(epoch)
        these_param_states.append(param_states[epoch])

    # A window of N states yields N-1 steps (differences of neighbours).
    interval_size = len(these_param_states) - 1
    these_steps = [
        later - earlier
        for earlier, later in zip(these_param_states[:interval_size],
                                  these_param_states[1:])
    ]

    # Fill the strict upper triangle and mirror it; the diagonal stays zero.
    this_angle_grid = np.zeros((interval_size, interval_size))
    for row in range(interval_size):
        for col in range(row + 1, interval_size):
            angle = angle_between(these_steps[row], these_steps[col])
            this_angle_grid[row, col] = angle
            this_angle_grid[col, row] = angle

    angle_grids.append(this_angle_grid)

0
100


In [22]:
import matplotlib.colors as colors
import matplotlib.cm as cm

# Draw one heat map per epoch window showing the pairwise angles between
# optimisation steps (radians, as returned by np.arccos in angle_between).
for angle_grid in angle_grids:
    plt.figure(figsize=(12,8))
    # imshow scales the colours to this grid's own min/max by default.
    image = plt.imshow(angle_grid, cmap=cm.jet)
    # Build the colorbar from the image itself so it is guaranteed to match the
    # plotted colours. A detached ScalarMappable passed without ax/cax is
    # rejected by recent Matplotlib releases, which cannot tell which Axes the
    # colorbar belongs to.
    plt.colorbar(image)
    plt.xlabel('Step i')
    plt.ylabel('Step j')
    
#print("num params:", len(these_param_states[0]))

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

In [23]:
from functions.plotting_DDplus_hists import load_data
from functions.utils import vector_to_state_dict

# Rebuild a state_dict from the stored parameter vector of every 10th epoch,
# keeping the epoch number alongside it as an (epoch, state_dict) pair.
state_dicts = [
    (epoch, vector_to_state_dict(param_states[epoch], model))
    for epoch in np.arange(0, num_epochs, 10)
]

# Load the data consumed by the histogram plotting cell that follows.
data = load_data()

Loading data...
pocaMx.shape =  (20000,)
nEvts =  20000
len(pocaMx[0]) =  211
len(pocaMx[1]) =  21
len(pocaMx[2]) =  20
len(pocaMx[3]) =  198
len(pocaMx[4]) =  233
majorAxis.shape =  (20000, 3)
minorAxis_1.shape =  (20000, 3)
minorAxis_2.shape =  (20000, 3)
have entered six_ellipsoid_parameters
  
 
  nEvts =  20000
 iEvt, nTrks =  0 211
 iEvt, nTrks =  1 21
 iEvt, nTrks =  2 20
 iEvt, nTrks =  3 198
 iEvt, nTrks =  4 233
 iEvt, nTrks =  5 85
 iEvt, nTrks =  6 223
 iEvt, nTrks =  7 425
 iEvt, nTrks =  8 252
 iEvt, nTrks =  9 169
A.shape =  (20000,)
majorAxis[iTrk][0][0] =  -0.00023452607
majorAxis[iTrk][1][0] =  -0.00047206535
majorAxis[iTrk][2][0] =  0.096502915
minorAxis_1[iTrk][0][0] =  -15.822749
minorAxis_1[iTrk][1][0] =  7.8608756
minorAxis_1[iTrk][2][0] =  -2.6228399e-08
minorAxis_2[iTrk][0][0] =  7.860759
minorAxis_2[iTrk][1][0] =  15.822513
minorAxis_2[iTrk][2][0] =  0.096502915
  
majorAxis[iTrk][0][0] =  -0.37655562
majorAxis[iTrk][1][0] =  0.2768704
majorAxis[iTrk][2][0] = 

In [24]:
from functions.plotting_DDplus_hists import plot_DDplus_hists as Plot
# Hand the (epoch, state_dict) snapshots and the loaded data to the project's
# plot_DDplus_hists helper (imported here as `Plot`).
# NOTE(review): the helper is defined outside this notebook; presumably it
# draws one set of histograms per snapshot -- confirm against its source.
Plot(state_dicts, data)

[0, 10, 20, 30, 40, 50, 60, 70, 80, 90, 100, 110, 120, 130, 140, 150, 160, 170, 180, 190]


<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>