In [1]:
import pickle
import pandas as pd
import os

import torch
import numpy as np
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim
from tqdm import tqdm, trange
import torch.optim as optim
from torch.utils.data import TensorDataset, DataLoader
import wandb
from torch.utils.data.sampler import SubsetRandomSampler
import pprint
import matplotlib.pyplot as plt
import torch

from sklearn.preprocessing import MinMaxScaler
import math
from torch.profiler import profile, record_function, ProfilerActivity

from operator import itemgetter
import operator
from random import randint
from rnn_classes import Dog, DogInput, Race, Races, GRUNet, smallGRUNet, smalll_lin_GRUNet
from raceDB import build_dataset, build_pred_dataset
import importlib
import datetime
from training_testing import validate_model, train_regular, train_log, train_super_batch, train_super_batch_KL, train_super_batch_L1, train_regular_L1,train_regular_one_hot
from model_saver import model_saver, model_saver_wandb



In [2]:
# Select the compute device once for the whole notebook: the first CUDA GPU
# when one is available, otherwise the CPU. The chosen device is reported on stdout.
device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
print("Running on the GPU" if device.type == "cuda" else "Running on the CPU")

Running on the GPU


In [3]:
# Make torch.FloatTensor the default tensor type for the rest of the session.
# NOTE(review): newer PyTorch releases deprecate this call in favour of
# torch.set_default_dtype / torch.set_default_device — confirm before upgrading
# from the 1.12.1 version this notebook was run with.
torch.set_default_tensor_type(torch.FloatTensor)

In [4]:
# Display the installed PyTorch version so the run environment is recorded with the outputs.
torch.__version__

'1.12.1'

In [5]:
def validation_CLE(x,y):
    """Return the element-wise cross-entropy terms ``-log_softmax(x) * y``.

    The softmax is taken over the last dimension of ``x``. No reduction is
    applied: the result has the broadcast shape of ``x`` and ``y``.

    Args:
        x: tensor of raw scores (logits).
        y: tensor of per-class weights/targets, broadcastable against ``x``.

    Returns:
        Tensor of un-reduced loss terms.
    """
    # torch.log_softmax uses the log-sum-exp trick, so large logits no longer
    # overflow in exp() and turn the result into NaN/inf as the explicit
    # log(exp(x) / sum(exp(x))) form did.
    return -torch.log_softmax(x, dim=-1) * y

In [6]:
def compare_model_to_bf(model:GRUNet,raceDB:Races,example_ct):
    """Compare the model's KL-divergence loss with that of the market-implied probabilities.

    Fetches every test race from ``raceDB``, drops races whose ``prices``
    contain ``0`` or ``-1``, then evaluates ``nn.KLDivLoss(reduction='batchmean')``
    against the stacked race ``classes`` for two predictors:

    * "our loss"   - log-softmax of the model output;
    * "their loss" - log of each race's ``implied_prob``.

    Both values are printed and logged to wandb, so a wandb run must be active.

    Args:
        model: network called with the list of retained races.
        raceDB: dataset providing ``test_race_ids`` and ``get_test_input``.
        example_ct: unused; kept so existing callers keep working.

    Returns:
        None.
    """
    # NOTE(review): the model is used in whatever train/eval mode the caller
    # left it in; confirm callers switch to eval() if dropout must be disabled.
    with torch.no_grad():
        l_sftmax = nn.LogSoftmax(dim=-1)
        # KLDivLoss takes log-probabilities as input and probabilities as target.
        kl_loss = nn.KLDivLoss(reduction='batchmean')

        full_test_races = raceDB.get_test_input(range(0,len(raceDB.test_race_ids)))
        full_test_races_w_prices = []
        excluded, included = 0,0
        for r in full_test_races:
            # Races containing a 0 or -1 price are excluded from the comparison.
            if 0 in r.prices or -1 in r.prices:
                excluded+=1
            else:
                full_test_races_w_prices.append(r)
                included+=1
        print(included,excluded)

        if not full_test_races_w_prices:
            # torch.stack on an empty list raises; report and stop instead.
            print("no test races with usable prices; nothing to compare")
            return

        output = l_sftmax(model(full_test_races_w_prices))
        # Keep the market probabilities on the same device as the model output
        # rather than assuming 'cuda:0', so this also runs on a CPU-only machine.
        bf_prices = torch.log(
            torch.tensor([x.implied_prob for x in full_test_races_w_prices]).to(output.device)
        )
        full_classes = torch.stack([x.classes for x in full_test_races_w_prices ])

        print()

        # Compute each loss once and reuse it for printing and logging.
        our_loss = kl_loss(output,full_classes)
        their_loss = kl_loss(bf_prices ,full_classes)
        print(f"our loss = {our_loss}")
        print(f"their loss = {their_loss}")
        wandb.log({"our loss":our_loss, "their loss":their_loss})

In [7]:
# Work from the data directory. It can be overridden with the GRV_DATA_DIR
# environment variable so the notebook is not tied to one user's machine; the
# default is the original location.
data_dir = os.environ.get("GRV_DATA_DIR", r"C:\Users\Nick\Documents\GitHub\grvmodel\Python\DATA")
os.chdir(data_dir)
# Alternative input file kept for reference: 'new gru input 2023-01.npy'
hidden_size = 64
# Build the race database from the saved input file, then compute its weights.
raceDB = build_dataset('new_windows_gru_REAL.npy', hidden_size ,state_filter="NZ", margin_type='neg_raw')
raceDB.create_new_weights_v2()


(1164832, 18)
(1164832, 18)
(123805, 21)
Latest date = 2023-03-02 00:00:00
num_features_per_dog=55


  for obj in iterable:
100%|██████████| 3489/3489 [00:26<00:00, 130.40it/s]
  for obj in iterable:
100%|██████████| 16386/16386 [00:32<00:00, 498.30it/s]


number of races = 16386, number of unique dogs = 3489
0        (Palmerston North, 410.0)
1        (Palmerston North, 410.0)
2        (Palmerston North, 410.0)
3        (Palmerston North, 410.0)
4        (Palmerston North, 410.0)
                   ...            
16381        (Christchurch, 295.0)
16382        (Christchurch, 520.0)
16383        (Christchurch, 295.0)
16384        (Christchurch, 295.0)
16385        (Christchurch, 295.0)
Length: 16386, dtype: object


In [8]:
# Date passed to the dataset's train/test split.
# NOTE(review): which side of the split the date itself falls on is decided
# inside create_test_split_date — confirm there.
date = datetime.date.fromisoformat("2022-08-01")
raceDB.create_test_split_date(date)

Train examples 13565, Test examples 2821


In [9]:
def closure(optimizer, criterion, outs, classes):
    """Clear gradients, back-propagate the MSE between ``outs`` and ``classes``, return the loss.

    Args:
        optimizer: optimizer whose gradients are cleared before the backward pass.
        criterion: accepted but not used; the loss is always mean-squared error.
        outs: model outputs (must be attached to the autograd graph).
        classes: targets with a shape compatible with ``outs``.

    Returns:
        The scalar MSE loss tensor, after ``backward()`` has been called on it.
    """
    optimizer.zero_grad()
    mse = F.mse_loss(outs, classes)
    mse.backward()
    return mse

def model_pipeline(my_dataset=raceDB,config=None,prev_model=None, sweep=True, model_state_dict=None, prev_model_file="rich-sweep-2"):
    """Train a ``smalll_lin_GRUNet`` inside a wandb run, save it, and return it.

    Args:
        my_dataset: dataset to train on; the module-level ``raceDB`` is used
            when ``None`` is passed.
        config: configuration handed to ``wandb.init``; all hyper-parameters are
            then read back from ``wandb.config``.
        prev_model: unused; kept for backward compatibility.
        sweep: when true, the dataset's recurrent states are reset after the
            run so the next sweep run does not inherit them.
        model_state_dict: optional state dict loaded into the new model.
        prev_model_file: name of a previously saved run; its ``_450.pt``
            checkpoint supplies both the dataset hidden states and the model
            weights. Pass ``None`` to start without a checkpoint.

    Returns:
        Tuple ``(model, dataset, optimizer)``.
    """
    dataset = my_dataset if my_dataset is not None else raceDB

    # tell wandb to get started
    with wandb.init(project="GRU - FastTrack - AUS Testing - L1", config=config):
        # access all HPs through wandb.config, so logging matches execution!
        wandb.define_metric("loss", summary="min")
        wandb.define_metric("test_accuracy", summary="max")
        wandb.define_metric("bfprofit", summary="max")
        wandb.define_metric("multibet profit", summary="max")

        config = wandb.config
        pprint.pprint(config)
        pprint.pprint(config.epochs)
        print(config)

        # Input width is taken from the first race of a two-race sample.
        # Use `dataset` throughout (not the global raceDB) so a caller-supplied
        # dataset is the one that is sized, primed, moved and trained on.
        input_size = dataset.get_race_input([0,1])[0].full_input.shape[0]

        model = smalll_lin_GRUNet(input_size,config['hidden_size'])
        if model_state_dict:
            model.load_state_dict(model_state_dict)
        if prev_model_file is not None:
            model_name = prev_model_file
            # NOTE(review): checkpoint location is an absolute, machine-specific path.
            model_loc = f"C:/Users/Nick/Documents/GitHub/grvmodel/Python/pytorch/New Model/savedmodel/{model_name}/{model_name}_450.pt"
            # Map onto the device selected for this notebook instead of assuming cuda:0.
            model_data = torch.load(model_loc,map_location=device)
            dataset.fill_hidden_states_from_dict(hidden_dict=model_data['db'])
            # Checkpoint weights are loaded last, so they override model_state_dict.
            model.load_state_dict(model_data['model_state_dict'])
            config['parent model'] = prev_model_file

        dataset.to_cuda()

        # NOTE(review): beta is fixed at 10 here; config['l1_beta'] is not read
        # in this function — confirm that is intended.
        criterion = nn.SmoothL1Loss(reduction='none', beta=10)
        # NOTE(review): Adam is always used; config['optimizer'] is not read here.
        optimizer = optim.Adam(model.parameters(), lr=config['learning_rate'])

        print(criterion, optimizer)

        scheduler = optim.lr_scheduler.ReduceLROnPlateau(optimizer, 'min',threshold=0.0001, patience=10000, verbose=True, factor=0.5)
        model = model.to(device)
        print(model)

        # Train; Ctrl-C / kernel interrupt stops early but still saves below.
        try:
            train_regular_L1(model, dataset, criterion, optimizer, scheduler, config)
        except KeyboardInterrupt:
            print("finished Early")

        dataset.create_hidden_states_dict()
        model_saver_wandb(model, optimizer, 450, 0.1, dataset.hidden_states_dict_gru, model_name="long nsw new  22000 RUN")
        if sweep:
            # The original line referenced the method without calling it, so
            # the reset never ran between sweep runs.
            dataset.reset_all_lstm_states()

    return (model,dataset, optimizer)

In [10]:

# wandb sweep definition: Bayesian search that maximises the "ROI < 30" metric.
metric = {"name": "ROI < 30", "goal": "maximize"}

# Search space. Entries with "value" are fixed; entries with "values" are
# categorical choices; learning_rate is sampled uniformly from [min, max].
parameters_dict = {
    "optimizer": {"value": "adamW"},
    "f1_layer_size": {"values": [256]},
    "f2_layer_size": {"values": [64]},
    "dropout": {"values": [0.3]},
    "len_data": {"value": len(raceDB.raceIDs)},
    "hidden_size": {"value":64},
    "epochs": {"values": [50]},
    "validation_split": {"value": 0.1},
    # other candidate loss names: "Huber", "MSE", "L1", "BCE", "Custom", "KL", "l1_custom"
    "loss": {"values": ["CEL"]},
    "num_layers": {"values": [2]},
    "learning_rate": {
        "distribution": "uniform",
        "min": 0.00001,
        "max": 0.001,
    },
    "l1_beta": {"value": 0.1},
    "batch_size": {"values": [100,250,500,1000]},
    "batch_before_backwards": {"values": [5,10,20]},
}

sweep_config = {
    "method": "bayes",
    "metric": metric,
    "parameters": parameters_dict,
}

pprint.pprint(sweep_config)


sweep_config

{'method': 'bayes',
 'metric': {'goal': 'maximize', 'name': 'ROI < 30'},
 'parameters': {'batch_before_backwards': {'values': [5, 10, 20]},
                'batch_size': {'values': [100, 250, 500, 1000]},
                'dropout': {'values': [0.3]},
                'epochs': {'values': [50]},
                'f1_layer_size': {'values': [256]},
                'f2_layer_size': {'values': [64]},
                'hidden_size': {'value': 64},
                'l1_beta': {'value': 0.1},
                'learning_rate': {'distribution': 'uniform',
                                  'max': 0.001,
                                  'min': 1e-05},
                'len_data': {'value': 16386},
                'loss': {'values': ['CEL']},
                'num_layers': {'values': [2]},
                'optimizer': {'value': 'adamW'},
                'validation_split': {'value': 0.1}}}


{'method': 'bayes',
 'metric': {'name': 'ROI < 30', 'goal': 'maximize'},
 'parameters': {'optimizer': {'value': 'adamW'},
  'f1_layer_size': {'values': [256]},
  'f2_layer_size': {'values': [64]},
  'dropout': {'values': [0.3]},
  'len_data': {'value': 16386},
  'hidden_size': {'value': 64},
  'epochs': {'values': [50]},
  'validation_split': {'value': 0.1},
  'loss': {'values': ['CEL']},
  'num_layers': {'values': [2]},
  'learning_rate': {'distribution': 'uniform', 'min': 1e-05, 'max': 0.001},
  'l1_beta': {'value': 0.1},
  'batch_size': {'values': [100, 250, 500, 1000]},
  'batch_before_backwards': {'values': [5, 10, 20]}}}

In [11]:
# Evaluated but not displayed (it is not the cell's last expression).
len(raceDB.raceIDs)
# Fixed hyper-parameters for a single, non-sweep training run.
wandb_config_static = {
    'hidden_size': hidden_size,
    'batch_size': 50,
    'dropout': 0.3,
    'epochs': 1000,
    'f1_layer_size': 256,
    'f2_layer_size': 64,
    'learning_rate': 0.00095,
    'loss': 'L1',
    'l1_beta': 0.1,
    'num_layers': 2,
    'optimizer': 'adamW',
    'validation_split': 0.1,
    'batch_before_backwards': 7,
}

In [12]:
# Single training run with the static config; sweep=False skips the post-run sweep branch.
model, dataset, optimizer = model_pipeline(
    my_dataset=raceDB,
    config=wandb_config_static,
    sweep=False,
)

Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.
[34m[1mwandb[0m: Currently logged in as: [33mnickojelly[0m (use `wandb login --relogin` to force relogin)


{'hidden_size': 64, 'batch_size': 50, 'dropout': 0.3, 'epochs': 1000, 'f1_layer_size': 256, 'f2_layer_size': 64, 'learning_rate': 0.00095, 'loss': 'L1', 'l1_beta': 0.1, 'num_layers': 2, 'optimizer': 'adamW', 'validation_split': 0.1, 'batch_before_backwards': 7}
1000
{'hidden_size': 64, 'batch_size': 50, 'dropout': 0.3, 'epochs': 1000, 'f1_layer_size': 256, 'f2_layer_size': 64, 'learning_rate': 0.00095, 'loss': 'L1', 'l1_beta': 0.1, 'num_layers': 2, 'optimizer': 'adamW', 'validation_split': 0.1, 'batch_before_backwards': 7}


100%|██████████| 16386/16386 [00:00<00:00, 18752.70it/s]


filled =0
empty  =131088
0.0null_dog=0
SmoothL1Loss() Adam (
Parameter Group 0
    amsgrad: False
    betas: (0.9, 0.999)
    capturable: False
    eps: 1e-08
    foreach: None
    lr: 0.00095
    maximize: False
    weight_decay: 0
)
smalll_lin_GRUNet(
  (batchnorm): BatchNorm1d(510, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (fc0): Linear(in_features=510, out_features=510, bias=True)
  (gru1): GRUCell(510, 64)
  (gru2): GRUCell(510, 64)
  (gru3): GRUCell(510, 64)
  (gru4): GRUCell(510, 64)
  (gru5): GRUCell(510, 64)
  (gru6): GRUCell(510, 64)
  (gru7): GRUCell(510, 64)
  (gru8): GRUCell(510, 64)
  (rl1): ReLU()
  (drop1): Dropout(p=0.3, inplace=False)
  (fc1): Linear(in_features=512, out_features=64, bias=True)
  (rl2): ReLU()
  (drop2): Dropout(p=0.3, inplace=False)
  (fc2): Linear(in_features=64, out_features=8, bias=True)
  (output_fn): Identity()
)


100%|██████████| 271/271 [00:46<00:00,  5.89it/s]
100%|██████████| 271/271 [00:44<00:00,  6.11it/s]t]
100%|██████████| 271/271 [00:40<00:00,  6.64it/s]t]
100%|██████████| 271/271 [00:42<00:00,  6.34it/s]t]
100%|██████████| 271/271 [00:42<00:00,  6.37it/s]t]
100%|██████████| 271/271 [00:40<00:00,  6.65it/s]t]
100%|██████████| 271/271 [00:41<00:00,  6.55it/s]t]
100%|██████████| 271/271 [00:43<00:00,  6.18it/s]t]
100%|██████████| 271/271 [00:43<00:00,  6.20it/s]t]
100%|██████████| 271/271 [00:43<00:00,  6.30it/s]t]
100%|██████████| 271/271 [00:41<00:00,  6.46it/s]it]
100%|██████████| 271/271 [00:41<00:00,  6.49it/s]it]
100%|██████████| 271/271 [00:42<00:00,  6.36it/s]it]
100%|██████████| 271/271 [00:41<00:00,  6.55it/s]it]
100%|██████████| 271/271 [00:41<00:00,  6.49it/s]it]
100%|██████████| 271/271 [00:42<00:00,  6.39it/s]it]
100%|██████████| 271/271 [00:42<00:00,  6.30it/s]it]
100%|██████████| 271/271 [00:41<00:00,  6.53it/s]it]
100%|██████████| 271/271 [00:40<00:00,  6.77it/s]it]
100%|

finished Early
created path



VBox(children=(Label(value='255.460 MB of 255.460 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0,…

0,1
FK ROI,▂▃▄▃▃▄▃▄▄▆▅▅▃▃▂▄▄▃▃▄▂▁▇▆▇▇▇█▅▃▅█▇▇▆▆▆▆▅▄
FK ROI < 30,▁▄▆▄▃▅█▄▅▇▄▅▄▄▂▅▆▅▄▅▂▂▇▇▆▆▅▆▅▃▄▇▆▅▆▅▅▆▅▅
ROI,▂▃▃▃▂▄▂▄▄▅▅▅▃▂▂▄▄▃▃▃▂▁▇▆▇▇▇█▅▃▅█▆▇▆▆▆▆▅▄
ROI < 30,▁▄▆▄▃▅█▄▄▇▄▅▄▄▃▅▇▅▅▅▂▂▇▇▆▆▅▆▅▄▄▇▆▅▆▅▅▆▅▅
accuracy,▄▃▄▄▃▅▃▃▄▅▇▄▁▃▃▁▂▃▄▄▄▅▇▇▆▇▅▇▅▅▇█▇▆▇▇▇▇▆▅
batch_before_backwards,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
batch_loss,█▆▆▄▄▃▃▅▃▄▃▂▃▃▄▃▃▂▂▂▂▃▂▂▂▁▂▂▂▃▂▂▁▁▂▂▂▂▂▂
correct,▄▃▄▄▃▅▃▃▄▅▇▄▁▃▃▁▂▃▄▄▄▅▇▇▆▇▅▇▅▅▇█▇▆▇▇▇▇▆▅
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇████
epoch_loss,█▇▆▅▄▄▄▃▃▃▃▄▃▃▃▃▃▃▂▃▂▂▂▂▂▁▂▂▁▂▁▁▂▁▁▁▁▁▁▁

0,1
FK ROI,-0.04097
FK ROI < 30,-0.05372
ROI,-0.03859
ROI < 30,-0.05389
accuracy,0.19273
batch_before_backwards,7.0
batch_loss,12.52422
correct,530.0
epoch,182.0
epoch_loss,13.28694


: 

In [None]:

# Register the sweep defined by sweep_config under the "GRU_sweeps" project.
sweep_id = wandb.sweep(sweep_config, project="GRU_sweeps")
# NOTE(review): this is a plain Python assignment; it does not set the
# CUDA_LAUNCH_BLOCKING environment variable. If synchronous kernel launches are
# wanted for debugging, the variable presumably has to be set in os.environ
# before CUDA is first initialised — confirm and move accordingly.
CUDA_LAUNCH_BLOCKING=1
# Run up to 100 sweep trials, each calling model_pipeline with its default arguments.
wandb.agent(sweep_id, function=model_pipeline, count=100)

Create sweep with ID: fkf5o4gd
Sweep URL: https://wandb.ai/nickojelly/GRU_sweeps/sweeps/fkf5o4gd


[34m[1mwandb[0m: Agent Starting Run: zp6bcv9v with config:
[34m[1mwandb[0m: 	batch_before_backwards: 5
[34m[1mwandb[0m: 	batch_size: 1000
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 50
[34m[1mwandb[0m: 	f1_layer_size: 256
[34m[1mwandb[0m: 	f2_layer_size: 64
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	l1_beta: 0.1
[34m[1mwandb[0m: 	learning_rate: 0.0003921465953934761
[34m[1mwandb[0m: 	len_data: 16325
[34m[1mwandb[0m: 	loss: CEL
[34m[1mwandb[0m: 	num_layers: 2
[34m[1mwandb[0m: 	optimizer: adamW
[34m[1mwandb[0m: 	validation_split: 0.1
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


{'batch_before_backwards': 5, 'batch_size': 1000, 'dropout': 0.3, 'epochs': 50, 'f1_layer_size': 256, 'f2_layer_size': 64, 'hidden_size': 64, 'l1_beta': 0.1, 'learning_rate': 0.0003921465953934761, 'len_data': 16325, 'loss': 'CEL', 'num_layers': 2, 'optimizer': 'adamW', 'validation_split': 0.1}
50
{'batch_before_backwards': 5, 'batch_size': 1000, 'dropout': 0.3, 'epochs': 50, 'f1_layer_size': 256, 'f2_layer_size': 64, 'hidden_size': 64, 'l1_beta': 0.1, 'learning_rate': 0.0003921465953934761, 'len_data': 16325, 'loss': 'CEL', 'num_layers': 2, 'optimizer': 'adamW', 'validation_split': 0.1}


100%|██████████| 16325/16325 [00:00<00:00, 21746.90it/s]


filled =0
empty  =130600
0.0null_dog=0
SmoothL1Loss() Adam (
Parameter Group 0
    amsgrad: False
    betas: (0.9, 0.999)
    capturable: False
    eps: 1e-08
    foreach: None
    lr: 0.0003921465953934761
    maximize: False
    weight_decay: 0
)
smalll_lin_GRUNet(
  (batchnorm): BatchNorm1d(510, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (fc0): Linear(in_features=510, out_features=510, bias=True)
  (gru1): GRUCell(510, 64)
  (gru2): GRUCell(510, 64)
  (gru3): GRUCell(510, 64)
  (gru4): GRUCell(510, 64)
  (gru5): GRUCell(510, 64)
  (gru6): GRUCell(510, 64)
  (gru7): GRUCell(510, 64)
  (gru8): GRUCell(510, 64)
  (rl1): ReLU()
  (drop1): Dropout(p=0.3, inplace=False)
  (fc1): Linear(in_features=512, out_features=64, bias=True)
  (rl2): ReLU()
  (drop2): Dropout(p=0.3, inplace=False)
  (fc2): Linear(in_features=64, out_features=8, bias=True)
  (output_fn): Identity()
)


100%|██████████| 13/13 [00:08<00:00,  1.46it/s]
100%|██████████| 13/13 [00:05<00:00,  2.33it/s]
100%|██████████| 13/13 [00:08<00:00,  1.51it/s]
100%|██████████| 13/13 [00:11<00:00,  1.10it/s]
100%|██████████| 13/13 [00:06<00:00,  1.97it/s]
100%|██████████| 13/13 [00:08<00:00,  1.51it/s]
100%|██████████| 13/13 [00:05<00:00,  2.36it/s]
100%|██████████| 13/13 [00:08<00:00,  1.49it/s]
100%|██████████| 13/13 [00:05<00:00,  2.39it/s]
100%|██████████| 13/13 [00:06<00:00,  2.05it/s]
100%|██████████| 13/13 [00:06<00:00,  2.08it/s]
100%|██████████| 13/13 [00:05<00:00,  2.22it/s]
100%|██████████| 13/13 [00:08<00:00,  1.45it/s]
100%|██████████| 13/13 [00:05<00:00,  2.34it/s]
100%|██████████| 13/13 [00:06<00:00,  2.04it/s]
100%|██████████| 13/13 [00:05<00:00,  2.40it/s]
100%|██████████| 13/13 [00:11<00:00,  1.10it/s]
100%|██████████| 13/13 [00:06<00:00,  2.09it/s]
100%|██████████| 13/13 [00:05<00:00,  2.41it/s]
100%|██████████| 13/13 [00:06<00:00,  2.08it/s]
100%|██████████| 13/13 [00:08<00:00,  1.

created path



VBox(children=(Label(value='67.403 MB of 67.403 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
FK ROI,█▇▆▆▅▄▂▁▃▂▁▁▂▃▃▄▄▃▃▃▄▄▃▂▃▄▄▄▅▅▄▅▄▄▅▅▆▆▄▅
FK ROI < 30,▁▁▂▄▄▄▅▅▆▆▅▅▄▄▄▄▄▄▄▄▅▅▄▄▅▅▅▆▆▆▆▆▆▇▇▇█▇▆▇
ROI,█▇▆▆▅▄▂▁▃▂▁▁▂▃▃▄▄▃▃▃▄▃▃▂▃▄▄▄▅▄▄▅▄▄▄▅▅▅▄▅
ROI < 30,▁▁▂▃▄▄▄▅▆▆▅▅▄▄▄▄▄▄▄▄▅▅▄▄▅▅▆▆▆▆▆▆▆▇▇▇█▇▇▇
accuracy,▄▄▅▆▃▃▁▁▃▂▅▅▅▅▅▆▅▅▅▅▅▅▅▄▅▅▆▆▅▆▆▆▆▇▇▆█▇▇▆
batch_before_backwards,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
batch_loss,█▂▇▄▂▇▄▂▆▄▆▄▂▆▄▁▆▄▁▆▁▆▃▁▆▃▁▆▃▁▃▁▆▃▁▆▃▁▅▃
correct,▄▄▅▆▃▃▁▁▃▂▅▅▅▅▅▆▅▅▅▅▅▅▅▄▅▅▆▆▅▆▆▆▆▇▇▆█▇▇▆
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
epoch_loss,█▆▅▅▅▄▄▄▄▄▄▄▄▄▃▃▃▄▃▃▃▃▃▃▃▃▃▂▂▂▂▂▂▂▂▁▂▁▁▁

0,1
FK ROI,-0.0441
FK ROI < 30,-0.05782
ROI,-0.04302
ROI < 30,-0.0606
accuracy,0.18545
batch_before_backwards,5.0
batch_loss,17.47592
correct,510.0
epoch,49.0
epoch_loss,17.47592


[34m[1mwandb[0m: Agent Starting Run: ohx15mpl with config:
[34m[1mwandb[0m: 	batch_before_backwards: 10
[34m[1mwandb[0m: 	batch_size: 1000
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 50
[34m[1mwandb[0m: 	f1_layer_size: 256
[34m[1mwandb[0m: 	f2_layer_size: 64
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	l1_beta: 0.1
[34m[1mwandb[0m: 	learning_rate: 0.00012066292095517836
[34m[1mwandb[0m: 	len_data: 16325
[34m[1mwandb[0m: 	loss: CEL
[34m[1mwandb[0m: 	num_layers: 2
[34m[1mwandb[0m: 	optimizer: adamW
[34m[1mwandb[0m: 	validation_split: 0.1
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


{'batch_before_backwards': 10, 'batch_size': 1000, 'dropout': 0.3, 'epochs': 50, 'f1_layer_size': 256, 'f2_layer_size': 64, 'hidden_size': 64, 'l1_beta': 0.1, 'learning_rate': 0.00012066292095517836, 'len_data': 16325, 'loss': 'CEL', 'num_layers': 2, 'optimizer': 'adamW', 'validation_split': 0.1}
50
{'batch_before_backwards': 10, 'batch_size': 1000, 'dropout': 0.3, 'epochs': 50, 'f1_layer_size': 256, 'f2_layer_size': 64, 'hidden_size': 64, 'l1_beta': 0.1, 'learning_rate': 0.00012066292095517836, 'len_data': 16325, 'loss': 'CEL', 'num_layers': 2, 'optimizer': 'adamW', 'validation_split': 0.1}


100%|██████████| 16325/16325 [00:00<00:00, 26781.92it/s]


filled =0
empty  =130600
0.0null_dog=0
SmoothL1Loss() Adam (
Parameter Group 0
    amsgrad: False
    betas: (0.9, 0.999)
    capturable: False
    eps: 1e-08
    foreach: None
    lr: 0.00012066292095517836
    maximize: False
    weight_decay: 0
)
smalll_lin_GRUNet(
  (batchnorm): BatchNorm1d(510, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (fc0): Linear(in_features=510, out_features=510, bias=True)
  (gru1): GRUCell(510, 64)
  (gru2): GRUCell(510, 64)
  (gru3): GRUCell(510, 64)
  (gru4): GRUCell(510, 64)
  (gru5): GRUCell(510, 64)
  (gru6): GRUCell(510, 64)
  (gru7): GRUCell(510, 64)
  (gru8): GRUCell(510, 64)
  (rl1): ReLU()
  (drop1): Dropout(p=0.3, inplace=False)
  (fc1): Linear(in_features=512, out_features=64, bias=True)
  (rl2): ReLU()
  (drop2): Dropout(p=0.3, inplace=False)
  (fc2): Linear(in_features=64, out_features=8, bias=True)
  (output_fn): Identity()
)


100%|██████████| 13/13 [00:06<00:00,  2.02it/s]
100%|██████████| 13/13 [00:06<00:00,  1.98it/s]
100%|██████████| 13/13 [00:08<00:00,  1.49it/s]
100%|██████████| 13/13 [00:12<00:00,  1.01it/s]
100%|██████████| 13/13 [00:06<00:00,  2.04it/s]
100%|██████████| 13/13 [00:06<00:00,  2.00it/s]
100%|██████████| 13/13 [00:06<00:00,  2.08it/s]
100%|██████████| 13/13 [00:06<00:00,  2.04it/s]
100%|██████████| 13/13 [00:05<00:00,  2.33it/s]
100%|██████████| 13/13 [00:12<00:00,  1.01it/s]
100%|██████████| 13/13 [00:06<00:00,  2.04it/s]
100%|██████████| 13/13 [00:06<00:00,  1.98it/s]
100%|██████████| 13/13 [00:06<00:00,  2.02it/s]
100%|██████████| 13/13 [00:08<00:00,  1.47it/s]
100%|██████████| 13/13 [00:06<00:00,  2.04it/s]
100%|██████████| 13/13 [00:06<00:00,  2.01it/s]
100%|██████████| 13/13 [00:12<00:00,  1.02it/s]
100%|██████████| 13/13 [00:08<00:00,  1.46it/s]
100%|██████████| 13/13 [00:05<00:00,  2.41it/s]
100%|██████████| 13/13 [00:05<00:00,  2.36it/s]
100%|██████████| 13/13 [00:05<00:00,  2.

created path



VBox(children=(Label(value='67.240 MB of 67.240 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
FK ROI,▇▆▇████████▇▇▇▇▇▇▇▇▆▆▆▆▆▄▄▄▄▄▄▃▃▂▂▂▁▂▂▂▁
FK ROI < 30,▁▁▂▂▂▃▃▃▄▄▅▅▅▆▆▆▇▇▇▇█████████████████▇▇▇
ROI,▇▇▇██████▇▇▇▇▇▆▆▆▆▆▅▅▅▅▅▄▄▃▃▃▃▃▃▂▂▂▁▂▂▂▁
ROI < 30,▁▁▂▂▃▃▃▄▄▄▄▅▅▆▆▆▇▇▇▇▇████████████████▇▇▇
accuracy,██▅█▅▆▆▆▇▇▇▆▆▇▆▅▅▄▄▄▃▃▄▄▃▄▄▄▃▃▂▁▃▂▂▁▂▁▁▁
batch_before_backwards,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
batch_loss,█▇▁▁▇▆▁▁▆▆▁▁▆▁▁▆▆▁▁▆▆▁▁▆▆▁▆▆▁▁▆▆▁▁▆▆▁▁▆▁
correct,██▅█▅▆▆▆▇▇▇▆▆▇▆▅▅▄▄▄▃▃▄▄▃▄▄▄▃▃▂▁▃▂▂▁▂▁▁▁
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
epoch_loss,█▅▅▄▄▃▃▃▃▂▃▂▂▂▂▂▂▂▂▂▂▂▁▂▁▁▂▁▁▁▁▁▁▁▂▁▁▁▁▁

0,1
FK ROI,-0.05742
FK ROI < 30,-0.08332
ROI,-0.05636
ROI < 30,-0.08831
accuracy,0.17964
batch_before_backwards,10.0
batch_loss,18.91152
correct,494.0
epoch,49.0
epoch_loss,18.91152


[34m[1mwandb[0m: Agent Starting Run: ue32hp97 with config:
[34m[1mwandb[0m: 	batch_before_backwards: 10
[34m[1mwandb[0m: 	batch_size: 100
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 50
[34m[1mwandb[0m: 	f1_layer_size: 256
[34m[1mwandb[0m: 	f2_layer_size: 64
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	l1_beta: 0.1
[34m[1mwandb[0m: 	learning_rate: 0.0007069882482912235
[34m[1mwandb[0m: 	len_data: 16325
[34m[1mwandb[0m: 	loss: CEL
[34m[1mwandb[0m: 	num_layers: 2
[34m[1mwandb[0m: 	optimizer: adamW
[34m[1mwandb[0m: 	validation_split: 0.1
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


{'batch_before_backwards': 10, 'batch_size': 100, 'dropout': 0.3, 'epochs': 50, 'f1_layer_size': 256, 'f2_layer_size': 64, 'hidden_size': 64, 'l1_beta': 0.1, 'learning_rate': 0.0007069882482912235, 'len_data': 16325, 'loss': 'CEL', 'num_layers': 2, 'optimizer': 'adamW', 'validation_split': 0.1}
50
{'batch_before_backwards': 10, 'batch_size': 100, 'dropout': 0.3, 'epochs': 50, 'f1_layer_size': 256, 'f2_layer_size': 64, 'hidden_size': 64, 'l1_beta': 0.1, 'learning_rate': 0.0007069882482912235, 'len_data': 16325, 'loss': 'CEL', 'num_layers': 2, 'optimizer': 'adamW', 'validation_split': 0.1}


100%|██████████| 16325/16325 [00:00<00:00, 27003.56it/s]


filled =0
empty  =130600
0.0null_dog=0
SmoothL1Loss() Adam (
Parameter Group 0
    amsgrad: False
    betas: (0.9, 0.999)
    capturable: False
    eps: 1e-08
    foreach: None
    lr: 0.0007069882482912235
    maximize: False
    weight_decay: 0
)
smalll_lin_GRUNet(
  (batchnorm): BatchNorm1d(510, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (fc0): Linear(in_features=510, out_features=510, bias=True)
  (gru1): GRUCell(510, 64)
  (gru2): GRUCell(510, 64)
  (gru3): GRUCell(510, 64)
  (gru4): GRUCell(510, 64)
  (gru5): GRUCell(510, 64)
  (gru6): GRUCell(510, 64)
  (gru7): GRUCell(510, 64)
  (gru8): GRUCell(510, 64)
  (rl1): ReLU()
  (drop1): Dropout(p=0.3, inplace=False)
  (fc1): Linear(in_features=512, out_features=64, bias=True)
  (rl2): ReLU()
  (drop2): Dropout(p=0.3, inplace=False)
  (fc2): Linear(in_features=64, out_features=8, bias=True)
  (output_fn): Identity()
)


100%|██████████| 135/135 [00:21<00:00,  6.25it/s]
100%|██████████| 135/135 [00:21<00:00,  6.30it/s]
100%|██████████| 135/135 [00:27<00:00,  4.88it/s]
100%|██████████| 135/135 [00:21<00:00,  6.31it/s]
100%|██████████| 135/135 [00:21<00:00,  6.23it/s]
100%|██████████| 135/135 [00:21<00:00,  6.28it/s]
100%|██████████| 135/135 [00:27<00:00,  4.94it/s]
100%|██████████| 135/135 [00:21<00:00,  6.25it/s]
100%|██████████| 135/135 [00:21<00:00,  6.24it/s]
100%|██████████| 135/135 [00:21<00:00,  6.29it/s]
100%|██████████| 135/135 [00:26<00:00,  5.05it/s]
100%|██████████| 135/135 [00:21<00:00,  6.26it/s]
100%|██████████| 135/135 [00:21<00:00,  6.17it/s]
100%|██████████| 135/135 [00:21<00:00,  6.23it/s]
100%|██████████| 135/135 [00:21<00:00,  6.25it/s]
100%|██████████| 135/135 [00:29<00:00,  4.53it/s]
100%|██████████| 135/135 [00:21<00:00,  6.26it/s]
100%|██████████| 135/135 [00:21<00:00,  6.23it/s]
100%|██████████| 135/135 [00:21<00:00,  6.30it/s]
100%|██████████| 135/135 [00:29<00:00,  4.57it/s]


created path



VBox(children=(Label(value='67.385 MB of 67.385 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
FK ROI,▃▄▂▁▁▅▄▃▃▆▅▄▂▄▃▂▄▄▃▃▅▃▂▄▃▂▄▄▄▄▃▄▆▇▆█▇▇▅▅
FK ROI < 30,▃▃▂▁▁▄▃▃▄▆█▇▆█▆▅█▇▅▆▇▆▅▇▆▄▄▆▄▆▃▅▆█▆█▆▆▇▆
ROI,▂▄▂▁▁▅▄▃▂▅▅▄▁▄▂▂▃▃▃▃▄▂▂▃▃▂▄▄▄▄▃▄▆█▆█▇▇▅▅
ROI < 30,▂▃▂▁▁▃▃▃▄▆▇▇▅▇▆▄▇▇▅▆▇▅▄▆▆▄▄▆▄▆▃▅▇█▆█▆▆▇▆
accuracy,▃▃▂▁▄▃▄▆▃▃▅▄▄▅▅▄▅▄▄▆▅▅▄▆▆▅▄▆▆█▆▆▅▆▅▅▅▆▆▇
batch_before_backwards,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
batch_loss,▄▅▅▂▄▅▂▄▃█▄▃█▃▄█▃▄▄▂▄▄▂▃▂▁▃▂▆▂▂▆▂▃▃▂▃▃▁▃
correct,▃▃▂▁▄▃▄▆▃▃▅▄▄▅▅▄▅▄▄▆▅▅▄▆▆▅▄▆▆█▆▆▅▆▅▅▅▆▆▇
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
epoch_loss,███▇▇▆▆▆▆▆▆▆▅▅▅▅▅▅▄▅▄▄▄▄▄▃▂▃▃▂▂▃▁▂▁▁▂▁▁▁

0,1
FK ROI,-0.03263
FK ROI < 30,-0.01909
ROI,-0.03141
ROI < 30,-0.01565
accuracy,0.19745
batch_before_backwards,10.0
batch_loss,17.34825
correct,543.0
epoch,49.0
epoch_loss,17.34825


[34m[1mwandb[0m: Agent Starting Run: blpeo95o with config:
[34m[1mwandb[0m: 	batch_before_backwards: 20
[34m[1mwandb[0m: 	batch_size: 100
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 50
[34m[1mwandb[0m: 	f1_layer_size: 256
[34m[1mwandb[0m: 	f2_layer_size: 64
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	l1_beta: 0.1
[34m[1mwandb[0m: 	learning_rate: 0.0006068160421309081
[34m[1mwandb[0m: 	len_data: 16325
[34m[1mwandb[0m: 	loss: CEL
[34m[1mwandb[0m: 	num_layers: 2
[34m[1mwandb[0m: 	optimizer: adamW
[34m[1mwandb[0m: 	validation_split: 0.1
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


{'batch_before_backwards': 20, 'batch_size': 100, 'dropout': 0.3, 'epochs': 50, 'f1_layer_size': 256, 'f2_layer_size': 64, 'hidden_size': 64, 'l1_beta': 0.1, 'learning_rate': 0.0006068160421309081, 'len_data': 16325, 'loss': 'CEL', 'num_layers': 2, 'optimizer': 'adamW', 'validation_split': 0.1}
50
{'batch_before_backwards': 20, 'batch_size': 100, 'dropout': 0.3, 'epochs': 50, 'f1_layer_size': 256, 'f2_layer_size': 64, 'hidden_size': 64, 'l1_beta': 0.1, 'learning_rate': 0.0006068160421309081, 'len_data': 16325, 'loss': 'CEL', 'num_layers': 2, 'optimizer': 'adamW', 'validation_split': 0.1}


100%|██████████| 16325/16325 [00:00<00:00, 27504.49it/s]


filled =0
empty  =130600
0.0null_dog=0
SmoothL1Loss() Adam (
Parameter Group 0
    amsgrad: False
    betas: (0.9, 0.999)
    capturable: False
    eps: 1e-08
    foreach: None
    lr: 0.0006068160421309081
    maximize: False
    weight_decay: 0
)
smalll_lin_GRUNet(
  (batchnorm): BatchNorm1d(510, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (fc0): Linear(in_features=510, out_features=510, bias=True)
  (gru1): GRUCell(510, 64)
  (gru2): GRUCell(510, 64)
  (gru3): GRUCell(510, 64)
  (gru4): GRUCell(510, 64)
  (gru5): GRUCell(510, 64)
  (gru6): GRUCell(510, 64)
  (gru7): GRUCell(510, 64)
  (gru8): GRUCell(510, 64)
  (rl1): ReLU()
  (drop1): Dropout(p=0.3, inplace=False)
  (fc1): Linear(in_features=512, out_features=64, bias=True)
  (rl2): ReLU()
  (drop2): Dropout(p=0.3, inplace=False)
  (fc2): Linear(in_features=64, out_features=8, bias=True)
  (output_fn): Identity()
)


100%|██████████| 135/135 [00:17<00:00,  7.73it/s]
100%|██████████| 135/135 [00:15<00:00,  8.55it/s]
100%|██████████| 135/135 [00:18<00:00,  7.29it/s]
100%|██████████| 135/135 [00:15<00:00,  8.68it/s]
100%|██████████| 135/135 [00:15<00:00,  8.82it/s]
100%|██████████| 135/135 [00:24<00:00,  5.59it/s]
100%|██████████| 135/135 [00:15<00:00,  8.73it/s]
100%|██████████| 135/135 [00:15<00:00,  8.65it/s]
100%|██████████| 135/135 [00:15<00:00,  8.62it/s]
100%|██████████| 135/135 [00:24<00:00,  5.48it/s]
100%|██████████| 135/135 [00:15<00:00,  8.86it/s]
100%|██████████| 135/135 [00:18<00:00,  7.29it/s]
100%|██████████| 135/135 [00:15<00:00,  8.68it/s]
100%|██████████| 135/135 [00:22<00:00,  6.02it/s]
100%|██████████| 135/135 [00:14<00:00,  9.17it/s]
100%|██████████| 135/135 [00:15<00:00,  8.79it/s]
100%|██████████| 135/135 [00:15<00:00,  8.56it/s]
100%|██████████| 135/135 [00:15<00:00,  8.71it/s]
100%|██████████| 135/135 [00:16<00:00,  7.99it/s]
100%|██████████| 135/135 [00:15<00:00,  8.75it/s]


created path



VBox(children=(Label(value='67.365 MB of 67.365 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
FK ROI,▅▂▂▃▃▃▃▃▃▂▃▃▃▂▃▁▃▂▂▁▂▂▂▂▄▃▂▃▄▄▄▄▄▅▄▅▆▆▇█
FK ROI < 30,▂▃▄▃▂▂▁▁▁▂▃▄▄▃▄▂▅▄▄▃▄▄▄▄▅▅▄▅▇▆▆▅▅▇▆▆▆▆▇█
ROI,▄▂▂▃▃▃▃▃▃▂▃▃▃▂▃▁▃▂▁▁▂▂▂▂▄▃▂▃▄▄▄▄▄▅▄▅▆▆▇█
ROI < 30,▂▃▄▃▂▂▂▁▁▂▃▃▄▃▄▂▅▄▃▃▄▄▄▄▅▅▅▅▇▆▇▅▅▇▆▆▆▆▇█
accuracy,▂▃▁▄▅▅▅▅▅▆▇▅▅▇▆▆▆▆▆▅▆▇▇█▇▇█▇▆▅▆▅▆▇▆▅▆█▆▇
batch_before_backwards,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
batch_loss,▅▆▆▃▄▅▃▃▂█▃▂▇▃▄▇▃▄▄▂▄▄▂▃▁▂▂▁▇▃▁▆▂▃▄▂▃▃▂▃
correct,▂▃▁▄▅▅▅▅▅▆▇▅▅▇▆▆▆▆▆▅▆▇▇█▇▇█▇▆▅▆▅▆▇▆▅▆█▆▇
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
epoch_loss,███▇▇▇▆▆▆▆▆▅▅▅▄▅▄▄▄▄▃▃▄▄▃▃▃▃▃▃▃▃▃▃▂▂▂▁▁▁

0,1
FK ROI,0.02095
FK ROI < 30,-0.01391
ROI,0.03325
ROI < 30,-0.00547
accuracy,0.18764
batch_before_backwards,20.0
batch_loss,50.63058
correct,516.0
epoch,49.0
epoch_loss,50.63058


[34m[1mwandb[0m: Agent Starting Run: u80vbbtm with config:
[34m[1mwandb[0m: 	batch_before_backwards: 20
[34m[1mwandb[0m: 	batch_size: 100
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 50
[34m[1mwandb[0m: 	f1_layer_size: 256
[34m[1mwandb[0m: 	f2_layer_size: 64
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	l1_beta: 0.1
[34m[1mwandb[0m: 	learning_rate: 0.0005980970763987507
[34m[1mwandb[0m: 	len_data: 16325
[34m[1mwandb[0m: 	loss: CEL
[34m[1mwandb[0m: 	num_layers: 2
[34m[1mwandb[0m: 	optimizer: adamW
[34m[1mwandb[0m: 	validation_split: 0.1
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


{'batch_before_backwards': 20, 'batch_size': 100, 'dropout': 0.3, 'epochs': 50, 'f1_layer_size': 256, 'f2_layer_size': 64, 'hidden_size': 64, 'l1_beta': 0.1, 'learning_rate': 0.0005980970763987507, 'len_data': 16325, 'loss': 'CEL', 'num_layers': 2, 'optimizer': 'adamW', 'validation_split': 0.1}
50
{'batch_before_backwards': 20, 'batch_size': 100, 'dropout': 0.3, 'epochs': 50, 'f1_layer_size': 256, 'f2_layer_size': 64, 'hidden_size': 64, 'l1_beta': 0.1, 'learning_rate': 0.0005980970763987507, 'len_data': 16325, 'loss': 'CEL', 'num_layers': 2, 'optimizer': 'adamW', 'validation_split': 0.1}


100%|██████████| 16325/16325 [00:00<00:00, 27597.59it/s]


filled =0
empty  =130600
0.0null_dog=0
SmoothL1Loss() Adam (
Parameter Group 0
    amsgrad: False
    betas: (0.9, 0.999)
    capturable: False
    eps: 1e-08
    foreach: None
    lr: 0.0005980970763987507
    maximize: False
    weight_decay: 0
)
smalll_lin_GRUNet(
  (batchnorm): BatchNorm1d(510, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (fc0): Linear(in_features=510, out_features=510, bias=True)
  (gru1): GRUCell(510, 64)
  (gru2): GRUCell(510, 64)
  (gru3): GRUCell(510, 64)
  (gru4): GRUCell(510, 64)
  (gru5): GRUCell(510, 64)
  (gru6): GRUCell(510, 64)
  (gru7): GRUCell(510, 64)
  (gru8): GRUCell(510, 64)
  (rl1): ReLU()
  (drop1): Dropout(p=0.3, inplace=False)
  (fc1): Linear(in_features=512, out_features=64, bias=True)
  (rl2): ReLU()
  (drop2): Dropout(p=0.3, inplace=False)
  (fc2): Linear(in_features=64, out_features=8, bias=True)
  (output_fn): Identity()
)


100%|██████████| 135/135 [00:15<00:00,  8.50it/s]
100%|██████████| 135/135 [00:17<00:00,  7.59it/s]
100%|██████████| 135/135 [00:24<00:00,  5.59it/s]
100%|██████████| 135/135 [00:18<00:00,  7.35it/s]
100%|██████████| 135/135 [00:15<00:00,  8.70it/s]
100%|██████████| 135/135 [00:15<00:00,  8.67it/s]
100%|██████████| 135/135 [00:15<00:00,  8.70it/s]
100%|██████████| 135/135 [00:15<00:00,  8.62it/s]
100%|██████████| 135/135 [00:15<00:00,  8.76it/s]
100%|██████████| 135/135 [00:16<00:00,  8.36it/s]
100%|██████████| 135/135 [00:15<00:00,  8.51it/s]
100%|██████████| 135/135 [00:17<00:00,  7.74it/s]
100%|██████████| 135/135 [00:15<00:00,  8.79it/s]
100%|██████████| 135/135 [00:15<00:00,  8.64it/s]
100%|██████████| 135/135 [00:15<00:00,  8.73it/s]
100%|██████████| 135/135 [00:24<00:00,  5.60it/s]
100%|██████████| 135/135 [00:15<00:00,  8.72it/s]
100%|██████████| 135/135 [00:15<00:00,  8.70it/s]
100%|██████████| 135/135 [00:15<00:00,  8.71it/s]
100%|██████████| 135/135 [00:19<00:00,  6.85it/s]





VBox(children=(Label(value='67.354 MB of 67.354 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
FK ROI,▃▂▂▂▃▃▃▃▃▃▂▁▃▂▂▂▂▂▂▂▁▁▂▁▃▂▄▄▄▄▆▅▅▇█▇▇▅▇▆
FK ROI < 30,▂▂▃▃▃▃▂▂▃▃▂▁▂▁▁▂▃▃▃▃▃▃▄▄▅▅▅▆▆▆█▆▆▆█████▇
ROI,▃▂▂▂▂▃▃▃▃▂▂▁▃▂▂▂▂▁▁▁▁▁▂▁▃▂▄▄▃▄▅▅▅▇█▇▆▅▇▆
ROI < 30,▂▂▃▃▃▃▂▂▃▂▂▁▂▁▁▂▃▃▃▃▃▃▃▄▅▅▅▆▆▅▇▆▆▆█████▇
accuracy,▂▂▁▄▄▄▅▄▆▅▅▅▄▅▃▄▅▅▅▅▅▄▃▄▅▅▄▅▅▄▆▄▃▅▆▆▆▆██
batch_before_backwards,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
batch_loss,▅▆▆▃▄▅▃▃▂█▃▂█▃▄▇▃▄▄▂▄▄▂▃▁▂▂▁▇▂▁▆▂▃▃▂▃▃▁▃
correct,▂▂▁▄▄▄▅▄▆▅▅▅▄▅▃▄▅▅▅▅▅▄▃▄▅▅▄▅▅▄▆▄▃▅▆▆▆▆██
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
epoch_loss,██▇▇▇▆▇▆▆▆▆▅▅▅▅▅▄▄▄▄▄▄▄▄▃▄▃▃▃▃▃▃▃▂▂▂▂▁▂▁

0,1
FK ROI,0.0321
FK ROI < 30,-0.01066
ROI,0.04561
ROI < 30,-0.00212
accuracy,0.19418
batch_before_backwards,20.0
batch_loss,49.64127
correct,534.0
epoch,49.0
epoch_loss,49.64127


[34m[1mwandb[0m: Agent Starting Run: pt751nco with config:
[34m[1mwandb[0m: 	batch_before_backwards: 5
[34m[1mwandb[0m: 	batch_size: 100
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 50
[34m[1mwandb[0m: 	f1_layer_size: 256
[34m[1mwandb[0m: 	f2_layer_size: 64
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	l1_beta: 0.1
[34m[1mwandb[0m: 	learning_rate: 0.0004723857813859652
[34m[1mwandb[0m: 	len_data: 16325
[34m[1mwandb[0m: 	loss: CEL
[34m[1mwandb[0m: 	num_layers: 2
[34m[1mwandb[0m: 	optimizer: adamW
[34m[1mwandb[0m: 	validation_split: 0.1
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


{'batch_before_backwards': 5, 'batch_size': 100, 'dropout': 0.3, 'epochs': 50, 'f1_layer_size': 256, 'f2_layer_size': 64, 'hidden_size': 64, 'l1_beta': 0.1, 'learning_rate': 0.0004723857813859652, 'len_data': 16325, 'loss': 'CEL', 'num_layers': 2, 'optimizer': 'adamW', 'validation_split': 0.1}
50
{'batch_before_backwards': 5, 'batch_size': 100, 'dropout': 0.3, 'epochs': 50, 'f1_layer_size': 256, 'f2_layer_size': 64, 'hidden_size': 64, 'l1_beta': 0.1, 'learning_rate': 0.0004723857813859652, 'len_data': 16325, 'loss': 'CEL', 'num_layers': 2, 'optimizer': 'adamW', 'validation_split': 0.1}


100%|██████████| 16325/16325 [00:00<00:00, 27597.55it/s]


filled =0
empty  =130600
0.0null_dog=0
SmoothL1Loss() Adam (
Parameter Group 0
    amsgrad: False
    betas: (0.9, 0.999)
    capturable: False
    eps: 1e-08
    foreach: None
    lr: 0.0004723857813859652
    maximize: False
    weight_decay: 0
)
smalll_lin_GRUNet(
  (batchnorm): BatchNorm1d(510, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (fc0): Linear(in_features=510, out_features=510, bias=True)
  (gru1): GRUCell(510, 64)
  (gru2): GRUCell(510, 64)
  (gru3): GRUCell(510, 64)
  (gru4): GRUCell(510, 64)
  (gru5): GRUCell(510, 64)
  (gru6): GRUCell(510, 64)
  (gru7): GRUCell(510, 64)
  (gru8): GRUCell(510, 64)
  (rl1): ReLU()
  (drop1): Dropout(p=0.3, inplace=False)
  (fc1): Linear(in_features=512, out_features=64, bias=True)
  (rl2): ReLU()
  (drop2): Dropout(p=0.3, inplace=False)
  (fc2): Linear(in_features=64, out_features=8, bias=True)
  (output_fn): Identity()
)


100%|██████████| 135/135 [00:30<00:00,  4.49it/s]
100%|██████████| 135/135 [00:27<00:00,  4.95it/s]
100%|██████████| 135/135 [00:29<00:00,  4.58it/s]
100%|██████████| 135/135 [00:30<00:00,  4.38it/s]
100%|██████████| 135/135 [00:26<00:00,  5.03it/s]
100%|██████████| 135/135 [00:30<00:00,  4.45it/s]
100%|██████████| 135/135 [00:31<00:00,  4.28it/s]
100%|██████████| 135/135 [00:29<00:00,  4.55it/s]
100%|██████████| 135/135 [00:27<00:00,  4.95it/s]
100%|██████████| 135/135 [00:27<00:00,  5.00it/s]
100%|██████████| 135/135 [00:32<00:00,  4.16it/s]
100%|██████████| 135/135 [00:27<00:00,  4.93it/s]
100%|██████████| 135/135 [00:30<00:00,  4.49it/s]
100%|██████████| 135/135 [00:32<00:00,  4.17it/s]
100%|██████████| 135/135 [00:26<00:00,  5.01it/s]
100%|██████████| 135/135 [00:27<00:00,  4.94it/s]
100%|██████████| 135/135 [00:32<00:00,  4.17it/s]
100%|██████████| 135/135 [00:29<00:00,  4.52it/s]
100%|██████████| 135/135 [00:27<00:00,  4.97it/s]
100%|██████████| 135/135 [00:29<00:00,  4.53it/s]


created path



VBox(children=(Label(value='67.489 MB of 67.489 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
FK ROI,▄▇▄▂▄▁▅▄▁▄▆▆▅▄▆▄▃▃▅▇▆█▆▅▄▅▄▄▂▂▃▂█▇█▆▆▇▅▇
FK ROI < 30,▄▃▂▂▂▁▃▂▂▄▆▅▆▄▆▆▅▅▆█▆▇▇▅▄▄▄▅▄▅▃▃▆▅▄▄▄▆▅▅
ROI,▄▇▅▂▅▂▆▅▁▄▆▆▅▄▆▄▃▃▅▇▆▇▆▅▄▅▅▅▂▂▃▂█▇█▆▅▇▅▇
ROI < 30,▄▃▃▂▂▁▃▂▂▄▆▆▆▅▆▆▅▅▆█▇▇▇▅▅▄▄▅▄▅▂▃▆▅▄▄▄▆▅▅
accuracy,▁▃▁▂▃▂▃▄▅▄▅▅▅▅▅▆▆▆▇▇▆▇▇▅▄▆▆▃▆▃▆▅▅▄▆▇█▇▆▅
batch_before_backwards,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
batch_loss,▅▆▇▂▅▆▂▅▅█▅▅█▄▅█▄▅▅▁▅▅▁▄▄▁▄▄▆▃▄▅▃▄▄▃▄▄▁▄
correct,▁▃▁▂▃▂▃▄▅▄▅▅▅▅▅▆▆▆▇▇▆▇▇▅▄▆▆▃▆▃▆▅▅▄▆▇█▇▆▅
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
epoch_loss,█▇█▇▇▆▆▅▅▅▅▅▆▄▅▅▅▄▃▄▃▃▃▃▂▃▂▂▂▂▂▂▁▂▁▁▁▁▁▁

0,1
FK ROI,-0.02945
FK ROI < 30,-0.04401
ROI,-0.02785
ROI < 30,-0.04571
accuracy,0.18691
batch_before_backwards,5.0
batch_loss,4.95803
correct,514.0
epoch,49.0
epoch_loss,4.95803


[34m[1mwandb[0m: Agent Starting Run: 649fnzi5 with config:
[34m[1mwandb[0m: 	batch_before_backwards: 20
[34m[1mwandb[0m: 	batch_size: 100
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 50
[34m[1mwandb[0m: 	f1_layer_size: 256
[34m[1mwandb[0m: 	f2_layer_size: 64
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	l1_beta: 0.1
[34m[1mwandb[0m: 	learning_rate: 0.0004808376045847639
[34m[1mwandb[0m: 	len_data: 16325
[34m[1mwandb[0m: 	loss: CEL
[34m[1mwandb[0m: 	num_layers: 2
[34m[1mwandb[0m: 	optimizer: adamW
[34m[1mwandb[0m: 	validation_split: 0.1
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


{'batch_before_backwards': 20, 'batch_size': 100, 'dropout': 0.3, 'epochs': 50, 'f1_layer_size': 256, 'f2_layer_size': 64, 'hidden_size': 64, 'l1_beta': 0.1, 'learning_rate': 0.0004808376045847639, 'len_data': 16325, 'loss': 'CEL', 'num_layers': 2, 'optimizer': 'adamW', 'validation_split': 0.1}
50
{'batch_before_backwards': 20, 'batch_size': 100, 'dropout': 0.3, 'epochs': 50, 'f1_layer_size': 256, 'f2_layer_size': 64, 'hidden_size': 64, 'l1_beta': 0.1, 'learning_rate': 0.0004808376045847639, 'len_data': 16325, 'loss': 'CEL', 'num_layers': 2, 'optimizer': 'adamW', 'validation_split': 0.1}


100%|██████████| 16325/16325 [00:00<00:00, 26054.61it/s]


filled =0
empty  =130600
0.0null_dog=0
SmoothL1Loss() Adam (
Parameter Group 0
    amsgrad: False
    betas: (0.9, 0.999)
    capturable: False
    eps: 1e-08
    foreach: None
    lr: 0.0004808376045847639
    maximize: False
    weight_decay: 0
)
smalll_lin_GRUNet(
  (batchnorm): BatchNorm1d(510, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (fc0): Linear(in_features=510, out_features=510, bias=True)
  (gru1): GRUCell(510, 64)
  (gru2): GRUCell(510, 64)
  (gru3): GRUCell(510, 64)
  (gru4): GRUCell(510, 64)
  (gru5): GRUCell(510, 64)
  (gru6): GRUCell(510, 64)
  (gru7): GRUCell(510, 64)
  (gru8): GRUCell(510, 64)
  (rl1): ReLU()
  (drop1): Dropout(p=0.3, inplace=False)
  (fc1): Linear(in_features=512, out_features=64, bias=True)
  (rl2): ReLU()
  (drop2): Dropout(p=0.3, inplace=False)
  (fc2): Linear(in_features=64, out_features=8, bias=True)
  (output_fn): Identity()
)


100%|██████████| 135/135 [00:18<00:00,  7.28it/s]
100%|██████████| 135/135 [00:19<00:00,  6.99it/s]
100%|██████████| 135/135 [00:18<00:00,  7.32it/s]
100%|██████████| 135/135 [00:15<00:00,  8.71it/s]
100%|██████████| 135/135 [00:18<00:00,  7.32it/s]
100%|██████████| 135/135 [00:24<00:00,  5.59it/s]
100%|██████████| 135/135 [00:15<00:00,  8.71it/s]
100%|██████████| 135/135 [00:18<00:00,  7.21it/s]
100%|██████████| 135/135 [00:15<00:00,  8.63it/s]
100%|██████████| 135/135 [00:21<00:00,  6.32it/s]
100%|██████████| 135/135 [00:14<00:00,  9.13it/s]
100%|██████████| 135/135 [00:15<00:00,  8.55it/s]
100%|██████████| 135/135 [00:18<00:00,  7.16it/s]
100%|██████████| 135/135 [00:15<00:00,  8.83it/s]
100%|██████████| 135/135 [00:18<00:00,  7.21it/s]
100%|██████████| 135/135 [00:21<00:00,  6.42it/s]
100%|██████████| 135/135 [00:17<00:00,  7.62it/s]
100%|██████████| 135/135 [00:15<00:00,  8.71it/s]
100%|██████████| 135/135 [00:15<00:00,  8.61it/s]
100%|██████████| 135/135 [00:18<00:00,  7.26it/s]


created path



VBox(children=(Label(value='67.350 MB of 67.350 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
FK ROI,█▅▃▂▄▄▄▂▆▇▅▅▆▅▇▅▅▅▃▁▂▂▃▄▄▄▃▃▄▄▃▄▆▆▆▅▇▇▇▄
FK ROI < 30,▁▂▃▂▂▂▁▁▂▄▃▃▂▃▄▄▄▃▂▂▁▂▂▃▅▄▃▃▃▄▅▆▇▅▇▆██▇▂
ROI,█▄▃▂▄▄▄▃▆▇▅▅▆▅▇▅▄▄▃▁▂▂▃▃▄▄▃▂▄▄▃▃▅▆▆▅▇▇▆▄
ROI < 30,▁▂▂▂▂▂▁▁▂▄▄▃▂▃▄▄▃▃▂▂▁▂▂▃▄▃▃▃▃▄▅▆▇▅▇▅██▆▂
accuracy,▁▁▁▂▄▄▅▄▅▅▅▅▆▇▅▅▅▆▆▆▅▆▆▅▇█▇▇▅▆▇▆▇▇██▆▆▅▆
batch_before_backwards,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
batch_loss,▅▆▅▃▄▅▃▃▂█▃▂█▃▄█▃▄▄▂▄▄▂▃▁▂▂▁▇▃▁▇▃▄▄▂▃▄▂▃
correct,▁▁▁▂▄▄▅▄▅▅▅▅▆▇▅▅▅▆▆▆▅▆▆▅▇█▇▇▅▆▇▆▇▇██▆▆▅▆
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
epoch_loss,█▇▇▇▆▆▆▆▅▅▅▅▅▅▅▄▄▄▃▃▃▃▃▃▃▃▃▂▂▂▂▂▂▂▂▁▂▁▁▁

0,1
FK ROI,-0.06324
FK ROI < 30,-0.0836
ROI,-0.06389
ROI < 30,-0.08995
accuracy,0.18764
batch_before_backwards,20.0
batch_loss,54.18754
correct,516.0
epoch,49.0
epoch_loss,54.18754


[34m[1mwandb[0m: Agent Starting Run: 887er3i2 with config:
[34m[1mwandb[0m: 	batch_before_backwards: 5
[34m[1mwandb[0m: 	batch_size: 1000
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 50
[34m[1mwandb[0m: 	f1_layer_size: 256
[34m[1mwandb[0m: 	f2_layer_size: 64
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	l1_beta: 0.1
[34m[1mwandb[0m: 	learning_rate: 0.0007796847016044851
[34m[1mwandb[0m: 	len_data: 16325
[34m[1mwandb[0m: 	loss: CEL
[34m[1mwandb[0m: 	num_layers: 2
[34m[1mwandb[0m: 	optimizer: adamW
[34m[1mwandb[0m: 	validation_split: 0.1
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


{'batch_before_backwards': 5, 'batch_size': 1000, 'dropout': 0.3, 'epochs': 50, 'f1_layer_size': 256, 'f2_layer_size': 64, 'hidden_size': 64, 'l1_beta': 0.1, 'learning_rate': 0.0007796847016044851, 'len_data': 16325, 'loss': 'CEL', 'num_layers': 2, 'optimizer': 'adamW', 'validation_split': 0.1}
50
{'batch_before_backwards': 5, 'batch_size': 1000, 'dropout': 0.3, 'epochs': 50, 'f1_layer_size': 256, 'f2_layer_size': 64, 'hidden_size': 64, 'l1_beta': 0.1, 'learning_rate': 0.0007796847016044851, 'len_data': 16325, 'loss': 'CEL', 'num_layers': 2, 'optimizer': 'adamW', 'validation_split': 0.1}


100%|██████████| 16325/16325 [00:00<00:00, 27093.33it/s]


filled =0
empty  =130600
0.0null_dog=0
SmoothL1Loss() Adam (
Parameter Group 0
    amsgrad: False
    betas: (0.9, 0.999)
    capturable: False
    eps: 1e-08
    foreach: None
    lr: 0.0007796847016044851
    maximize: False
    weight_decay: 0
)
smalll_lin_GRUNet(
  (batchnorm): BatchNorm1d(510, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (fc0): Linear(in_features=510, out_features=510, bias=True)
  (gru1): GRUCell(510, 64)
  (gru2): GRUCell(510, 64)
  (gru3): GRUCell(510, 64)
  (gru4): GRUCell(510, 64)
  (gru5): GRUCell(510, 64)
  (gru6): GRUCell(510, 64)
  (gru7): GRUCell(510, 64)
  (gru8): GRUCell(510, 64)
  (rl1): ReLU()
  (drop1): Dropout(p=0.3, inplace=False)
  (fc1): Linear(in_features=512, out_features=64, bias=True)
  (rl2): ReLU()
  (drop2): Dropout(p=0.3, inplace=False)
  (fc2): Linear(in_features=64, out_features=8, bias=True)
  (output_fn): Identity()
)


100%|██████████| 13/13 [00:05<00:00,  2.31it/s]
100%|██████████| 13/13 [00:06<00:00,  2.00it/s]
100%|██████████| 13/13 [00:09<00:00,  1.37it/s]
100%|██████████| 13/13 [00:11<00:00,  1.10it/s]
100%|██████████| 13/13 [00:07<00:00,  1.79it/s]
100%|██████████| 13/13 [00:05<00:00,  2.36it/s]
100%|██████████| 13/13 [00:06<00:00,  2.04it/s]
100%|██████████| 13/13 [00:06<00:00,  2.03it/s]
100%|██████████| 13/13 [00:06<00:00,  2.05it/s]
100%|██████████| 13/13 [00:05<00:00,  2.35it/s]
100%|██████████| 13/13 [00:09<00:00,  1.40it/s]
100%|██████████| 13/13 [00:06<00:00,  2.05it/s]
100%|██████████| 13/13 [00:06<00:00,  2.07it/s]
100%|██████████| 13/13 [00:06<00:00,  2.05it/s]
100%|██████████| 13/13 [00:06<00:00,  2.01it/s]
100%|██████████| 13/13 [00:06<00:00,  2.01it/s]
100%|██████████| 13/13 [00:11<00:00,  1.10it/s]
100%|██████████| 13/13 [00:06<00:00,  2.06it/s]
100%|██████████| 13/13 [00:06<00:00,  2.06it/s]
100%|██████████| 13/13 [00:06<00:00,  2.10it/s]
100%|██████████| 13/13 [00:06<00:00,  2.

created path



VBox(children=(Label(value='67.382 MB of 67.382 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
FK ROI,█▆▅▄▁▁▃▄▄▄▅▆▄▄▄▅▅▄▄▄▃▃▂▂▃▄▄▄▄▄▅▆▆▅▅▅▆▆▆▅
FK ROI < 30,▂▁▁▁▃▃▄▃▁▁▂▂▂▂▃▃▂▂▁▂▂▂▂▂▃▃▂▃▄▃▃▄▅▅▅▆██▇▇
ROI,█▆▅▄▁▂▃▄▄▄▅▆▅▄▄▅▅▄▄▄▃▃▂▃▃▄▄▄▄▄▅▅▅▅▄▄▅▅▆▄
ROI < 30,▂▁▁▁▃▃▄▃▁▁▂▂▂▂▃▃▂▂▂▂▂▂▂▂▃▃▂▃▄▃▃▄▅▅▅▅███▇
accuracy,▃▃▄▃▁▁▁▄▄▄▅▄▅▆▅▅▄▄▄▅▄▄▅▆▅▅▄▅▆▅▆▆▇▆▆▆▇▇▇█
batch_before_backwards,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
batch_loss,█▂▇▄▂▇▄▂▇▄▇▄▂▆▄▂▆▄▂▆▁▆▄▁▆▃▁▆▃▁▃▁▅▃▁▅▃▁▅▃
correct,▃▃▄▃▁▁▁▄▄▄▅▄▅▆▅▅▄▄▄▅▄▄▅▆▅▅▄▅▆▅▆▆▇▆▆▆▇▇▇█
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
epoch_loss,█▆▆▆▅▅▅▅▅▅▅▄▄▄▄▄▄▃▃▃▃▃▃▃▂▂▂▂▂▂▂▂▂▁▁▂▁▁▁▁

0,1
FK ROI,-0.05946
FK ROI < 30,-0.01704
ROI,-0.06375
ROI < 30,-0.01547
accuracy,0.19782
batch_before_backwards,5.0
batch_loss,16.85309
correct,544.0
epoch,49.0
epoch_loss,16.85309


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: xz5zns7m with config:
[34m[1mwandb[0m: 	batch_before_backwards: 5
[34m[1mwandb[0m: 	batch_size: 250
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 50
[34m[1mwandb[0m: 	f1_layer_size: 256
[34m[1mwandb[0m: 	f2_layer_size: 64
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	l1_beta: 0.1
[34m[1mwandb[0m: 	learning_rate: 0.00048201439333189376
[34m[1mwandb[0m: 	len_data: 16325
[34m[1mwandb[0m: 	loss: CEL
[34m[1mwandb[0m: 	num_layers: 2
[34m[1mwandb[0m: 	optimizer: adamW
[34m[1mwandb[0m: 	validation_split: 0.1
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


{'batch_before_backwards': 5, 'batch_size': 250, 'dropout': 0.3, 'epochs': 50, 'f1_layer_size': 256, 'f2_layer_size': 64, 'hidden_size': 64, 'l1_beta': 0.1, 'learning_rate': 0.00048201439333189376, 'len_data': 16325, 'loss': 'CEL', 'num_layers': 2, 'optimizer': 'adamW', 'validation_split': 0.1}
50
{'batch_before_backwards': 5, 'batch_size': 250, 'dropout': 0.3, 'epochs': 50, 'f1_layer_size': 256, 'f2_layer_size': 64, 'hidden_size': 64, 'l1_beta': 0.1, 'learning_rate': 0.00048201439333189376, 'len_data': 16325, 'loss': 'CEL', 'num_layers': 2, 'optimizer': 'adamW', 'validation_split': 0.1}


100%|██████████| 16325/16325 [00:00<00:00, 27458.21it/s]


filled =0
empty  =130600
0.0null_dog=0
SmoothL1Loss() Adam (
Parameter Group 0
    amsgrad: False
    betas: (0.9, 0.999)
    capturable: False
    eps: 1e-08
    foreach: None
    lr: 0.00048201439333189376
    maximize: False
    weight_decay: 0
)
smalll_lin_GRUNet(
  (batchnorm): BatchNorm1d(510, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (fc0): Linear(in_features=510, out_features=510, bias=True)
  (gru1): GRUCell(510, 64)
  (gru2): GRUCell(510, 64)
  (gru3): GRUCell(510, 64)
  (gru4): GRUCell(510, 64)
  (gru5): GRUCell(510, 64)
  (gru6): GRUCell(510, 64)
  (gru7): GRUCell(510, 64)
  (gru8): GRUCell(510, 64)
  (rl1): ReLU()
  (drop1): Dropout(p=0.3, inplace=False)
  (fc1): Linear(in_features=512, out_features=64, bias=True)
  (rl2): ReLU()
  (drop2): Dropout(p=0.3, inplace=False)
  (fc2): Linear(in_features=64, out_features=8, bias=True)
  (output_fn): Identity()
)


100%|██████████| 54/54 [00:16<00:00,  3.19it/s]
100%|██████████| 54/54 [00:13<00:00,  3.96it/s]
100%|██████████| 54/54 [00:23<00:00,  2.26it/s]
100%|██████████| 54/54 [00:13<00:00,  4.05it/s]
100%|██████████| 54/54 [00:16<00:00,  3.20it/s]
100%|██████████| 54/54 [00:16<00:00,  3.22it/s]
100%|██████████| 54/54 [00:19<00:00,  2.83it/s]
100%|██████████| 54/54 [00:16<00:00,  3.20it/s]
100%|██████████| 54/54 [00:13<00:00,  3.97it/s]
100%|██████████| 54/54 [00:16<00:00,  3.18it/s]
100%|██████████| 54/54 [00:13<00:00,  4.02it/s]
100%|██████████| 54/54 [00:17<00:00,  3.16it/s]
100%|██████████| 54/54 [00:20<00:00,  2.59it/s]
100%|██████████| 54/54 [00:16<00:00,  3.23it/s]
100%|██████████| 54/54 [00:13<00:00,  3.95it/s]
100%|██████████| 54/54 [00:17<00:00,  3.17it/s]
100%|██████████| 54/54 [00:13<00:00,  4.02it/s]
100%|██████████| 54/54 [00:19<00:00,  2.72it/s]
100%|██████████| 54/54 [00:13<00:00,  4.03it/s]
100%|██████████| 54/54 [00:16<00:00,  3.21it/s]
100%|██████████| 54/54 [00:16<00:00,  3.

created path



VBox(children=(Label(value='67.425 MB of 67.425 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
FK ROI,▄▃▄▅▆▅▆▅▆▆▄▄▃▁▃▃▄▆▆▄▄▄▆▄▂▁▄▅▃▄▇▅▇▅▇▆▆▅██
FK ROI < 30,▁▃▃▃▄▄▅▄▅▄▃▄▃▃▅▄█▆▆▄▅▆▇▆▂▃▄▄▄▆▇▆▅▆▇▇▆▇██
ROI,▄▃▄▅▆▅▆▅▆▇▄▄▃▁▃▃▄▆▅▄▄▄▆▄▂▁▄▅▃▄▇▅█▆▇▆▆▅██
ROI < 30,▁▄▄▃▄▅▆▄▆▄▄▄▃▃▄▄▇▆▆▄▅▆▇▆▂▄▅▄▄▇▇▆▅▆▇▇▇▇██
accuracy,▂▁▂▃▃▃▃▃▄▃▃▂▃▅▃▃▃▄▃▄▄▅▇▅▄▆▄▅▇▇▇▇▆▇▇▇██▇█
batch_before_backwards,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
batch_loss,▅█▄▃▂▃▄▇▃▃▂▃▁▄▂▄▂▃▃▃▆▃▂▁▂▁▃▂▂▂▃▁▃▆▃▂▁▂▃▅
correct,▂▁▂▃▃▃▃▃▄▃▃▂▃▅▃▃▃▄▃▄▄▅▇▅▄▆▄▅▇▇▇▇▆▇▇▇██▇█
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
epoch_loss,██▇▇▇▇▇▆▆▅▅▅▅▄▄▄▄▄▄▄▄▄▃▃▃▃▃▃▃▃▃▂▃▂▂▂▁▂▁▁

0,1
FK ROI,-0.00756
FK ROI < 30,-0.0074
ROI,-0.00529
ROI < 30,-0.00523
accuracy,0.20145
batch_before_backwards,5.0
batch_loss,18.32696
correct,554.0
epoch,49.0
epoch_loss,18.32696


[34m[1mwandb[0m: Agent Starting Run: xgulchw7 with config:
[34m[1mwandb[0m: 	batch_before_backwards: 10
[34m[1mwandb[0m: 	batch_size: 100
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 50
[34m[1mwandb[0m: 	f1_layer_size: 256
[34m[1mwandb[0m: 	f2_layer_size: 64
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	l1_beta: 0.1
[34m[1mwandb[0m: 	learning_rate: 0.0005796136324016931
[34m[1mwandb[0m: 	len_data: 16325
[34m[1mwandb[0m: 	loss: CEL
[34m[1mwandb[0m: 	num_layers: 2
[34m[1mwandb[0m: 	optimizer: adamW
[34m[1mwandb[0m: 	validation_split: 0.1
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


{'batch_before_backwards': 10, 'batch_size': 100, 'dropout': 0.3, 'epochs': 50, 'f1_layer_size': 256, 'f2_layer_size': 64, 'hidden_size': 64, 'l1_beta': 0.1, 'learning_rate': 0.0005796136324016931, 'len_data': 16325, 'loss': 'CEL', 'num_layers': 2, 'optimizer': 'adamW', 'validation_split': 0.1}
50
{'batch_before_backwards': 10, 'batch_size': 100, 'dropout': 0.3, 'epochs': 50, 'f1_layer_size': 256, 'f2_layer_size': 64, 'hidden_size': 64, 'l1_beta': 0.1, 'learning_rate': 0.0005796136324016931, 'len_data': 16325, 'loss': 'CEL', 'num_layers': 2, 'optimizer': 'adamW', 'validation_split': 0.1}


100%|██████████| 16325/16325 [00:00<00:00, 25930.33it/s]


filled =0
empty  =130600
0.0null_dog=0
SmoothL1Loss() Adam (
Parameter Group 0
    amsgrad: False
    betas: (0.9, 0.999)
    capturable: False
    eps: 1e-08
    foreach: None
    lr: 0.0005796136324016931
    maximize: False
    weight_decay: 0
)
smalll_lin_GRUNet(
  (batchnorm): BatchNorm1d(510, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (fc0): Linear(in_features=510, out_features=510, bias=True)
  (gru1): GRUCell(510, 64)
  (gru2): GRUCell(510, 64)
  (gru3): GRUCell(510, 64)
  (gru4): GRUCell(510, 64)
  (gru5): GRUCell(510, 64)
  (gru6): GRUCell(510, 64)
  (gru7): GRUCell(510, 64)
  (gru8): GRUCell(510, 64)
  (rl1): ReLU()
  (drop1): Dropout(p=0.3, inplace=False)
  (fc1): Linear(in_features=512, out_features=64, bias=True)
  (rl2): ReLU()
  (drop2): Dropout(p=0.3, inplace=False)
  (fc2): Linear(in_features=64, out_features=8, bias=True)
  (output_fn): Identity()
)


100%|██████████| 135/135 [00:22<00:00,  6.10it/s]
100%|██████████| 135/135 [00:22<00:00,  5.91it/s]
100%|██████████| 135/135 [00:22<00:00,  6.07it/s]
100%|██████████| 135/135 [00:19<00:00,  7.10it/s]
100%|██████████| 135/135 [00:22<00:00,  6.05it/s]
100%|██████████| 135/135 [00:22<00:00,  6.12it/s]
100%|██████████| 135/135 [00:25<00:00,  5.35it/s]
100%|██████████| 135/135 [00:22<00:00,  6.11it/s]
100%|██████████| 135/135 [00:22<00:00,  6.01it/s]
100%|██████████| 135/135 [00:18<00:00,  7.16it/s]
100%|██████████| 135/135 [00:28<00:00,  4.81it/s]
100%|██████████| 135/135 [00:22<00:00,  5.97it/s]
100%|██████████| 135/135 [00:19<00:00,  7.06it/s]
100%|██████████| 135/135 [00:23<00:00,  5.78it/s]
100%|██████████| 135/135 [00:22<00:00,  6.03it/s]
100%|██████████| 135/135 [00:18<00:00,  7.15it/s]
100%|██████████| 135/135 [00:22<00:00,  5.93it/s]
100%|██████████| 135/135 [00:23<00:00,  5.81it/s]
100%|██████████| 135/135 [00:18<00:00,  7.14it/s]
100%|██████████| 135/135 [00:22<00:00,  6.07it/s]


created path



VBox(children=(Label(value='67.408 MB of 67.408 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
FK ROI,▃▁▃▂▁▃▃▃▂▂▂▃▃▃▄▃▂▃▂▄▄▆▄▃▄▆▅▅▆▆▆▄▅▅▆▇▆▇█▅
FK ROI < 30,▄▂▃▁▁▃▄▃▂▂▂▂▅▆▇▅▄▄▅▆▆█▇▄▅▇▇▆▆▆▅▆▆▇▅█▅▆█▆
ROI,▂▁▃▂▁▃▃▃▂▂▂▃▃▃▄▃▃▃▂▃▄▆▄▃▄▆▅▅▆▆▆▅▅▅▆▇▆▇█▅
ROI < 30,▃▂▃▁▁▃▄▃▂▂▂▂▄▆▇▅▄▄▅▆▆▇▇▄▆▇▇▆▅▆▆▆▇▇▅█▅▆█▆
accuracy,▂▁▂▂▃▃▄▄▃▅▃▂▃▄▅▂▃▃▃▅▂▅▅▃▃▄▃▄▆▅▄▃▃▃█▃▆▄▆▅
batch_before_backwards,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
batch_loss,▄▅▅▂▄▅▂▄▃█▄▃█▃▄▇▃▄▄▂▄▄▂▃▂▁▃▂▆▂▂▆▂▃▃▂▃▃▁▃
correct,▂▁▂▂▃▃▄▄▃▅▃▂▃▄▅▂▃▃▃▅▂▅▅▃▃▄▃▄▆▅▄▃▃▃█▃▆▄▆▅
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
epoch_loss,██▇▇▇▇▆▆▅▅▅▅▅▅▅▄▅▅▄▄▄▄▄▄▃▄▃▃▃▂▂▂▁▂▂▁▁▂▁▁

0,1
FK ROI,-0.02234
FK ROI < 30,-0.04927
ROI,-0.01447
ROI < 30,-0.04477
accuracy,0.18618
batch_before_backwards,10.0
batch_loss,18.06277
correct,512.0
epoch,49.0
epoch_loss,18.06277


[34m[1mwandb[0m: Agent Starting Run: jgmtjbqe with config:
[34m[1mwandb[0m: 	batch_before_backwards: 20
[34m[1mwandb[0m: 	batch_size: 500
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 50
[34m[1mwandb[0m: 	f1_layer_size: 256
[34m[1mwandb[0m: 	f2_layer_size: 64
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	l1_beta: 0.1
[34m[1mwandb[0m: 	learning_rate: 0.0009348872323541364
[34m[1mwandb[0m: 	len_data: 16325
[34m[1mwandb[0m: 	loss: CEL
[34m[1mwandb[0m: 	num_layers: 2
[34m[1mwandb[0m: 	optimizer: adamW
[34m[1mwandb[0m: 	validation_split: 0.1
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


{'batch_before_backwards': 20, 'batch_size': 500, 'dropout': 0.3, 'epochs': 50, 'f1_layer_size': 256, 'f2_layer_size': 64, 'hidden_size': 64, 'l1_beta': 0.1, 'learning_rate': 0.0009348872323541364, 'len_data': 16325, 'loss': 'CEL', 'num_layers': 2, 'optimizer': 'adamW', 'validation_split': 0.1}
50
{'batch_before_backwards': 20, 'batch_size': 500, 'dropout': 0.3, 'epochs': 50, 'f1_layer_size': 256, 'f2_layer_size': 64, 'hidden_size': 64, 'l1_beta': 0.1, 'learning_rate': 0.0009348872323541364, 'len_data': 16325, 'loss': 'CEL', 'num_layers': 2, 'optimizer': 'adamW', 'validation_split': 0.1}


100%|██████████| 16325/16325 [00:00<00:00, 28218.30it/s]


filled =0
empty  =130600
0.0null_dog=0
SmoothL1Loss() Adam (
Parameter Group 0
    amsgrad: False
    betas: (0.9, 0.999)
    capturable: False
    eps: 1e-08
    foreach: None
    lr: 0.0009348872323541364
    maximize: False
    weight_decay: 0
)
smalll_lin_GRUNet(
  (batchnorm): BatchNorm1d(510, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (fc0): Linear(in_features=510, out_features=510, bias=True)
  (gru1): GRUCell(510, 64)
  (gru2): GRUCell(510, 64)
  (gru3): GRUCell(510, 64)
  (gru4): GRUCell(510, 64)
  (gru5): GRUCell(510, 64)
  (gru6): GRUCell(510, 64)
  (gru7): GRUCell(510, 64)
  (gru8): GRUCell(510, 64)
  (rl1): ReLU()
  (drop1): Dropout(p=0.3, inplace=False)
  (fc1): Linear(in_features=512, out_features=64, bias=True)
  (rl2): ReLU()
  (drop2): Dropout(p=0.3, inplace=False)
  (fc2): Linear(in_features=64, out_features=8, bias=True)
  (output_fn): Identity()
)


100%|██████████| 27/27 [00:08<00:00,  3.34it/s]
100%|██████████| 27/27 [00:07<00:00,  3.39it/s]
100%|██████████| 27/27 [00:07<00:00,  3.43it/s]
100%|██████████| 27/27 [00:07<00:00,  3.46it/s]
100%|██████████| 27/27 [00:14<00:00,  1.84it/s]
100%|██████████| 27/27 [00:07<00:00,  3.45it/s]
100%|██████████| 27/27 [00:07<00:00,  3.49it/s]
100%|██████████| 27/27 [00:07<00:00,  3.44it/s]
100%|██████████| 27/27 [00:07<00:00,  3.48it/s]
100%|██████████| 27/27 [00:14<00:00,  1.83it/s]
100%|██████████| 27/27 [00:07<00:00,  3.48it/s]
100%|██████████| 27/27 [00:07<00:00,  3.40it/s]
100%|██████████| 27/27 [00:07<00:00,  3.42it/s]
100%|██████████| 27/27 [00:07<00:00,  3.44it/s]
100%|██████████| 27/27 [00:14<00:00,  1.83it/s]
100%|██████████| 27/27 [00:07<00:00,  3.47it/s]
100%|██████████| 27/27 [00:07<00:00,  3.43it/s]
100%|██████████| 27/27 [00:07<00:00,  3.44it/s]
100%|██████████| 27/27 [00:07<00:00,  3.45it/s]
100%|██████████| 27/27 [00:14<00:00,  1.83it/s]
100%|██████████| 27/27 [00:09<00:00,  2.