In [1]:
import pandas as pd
import numpy as np
import sklearn as sk
import os
import torch
import copy
from torch.utils.data import Dataset, DataLoader

from sklearn.feature_extraction import DictVectorizer
from sklearn.externals import joblib
from sklearn.model_selection import ParameterGrid


from functools import reduce
from util import *

In [2]:
# %load_ext autoreload
# %autoreload 2

In [3]:
# Record once whether CUDA is usable; the training cell uses this flag to
# decide whether to move the models to the GPU and passes it to the trainer.
use_gpu = torch.cuda.is_available()
print(use_gpu)

True


In [4]:
# Experiment tag: used as the sub-folder name for this run's checkpoints and
# performance files.
exp_name = 'exp2'

# Folder holding the preprocessed data, relative to the notebook.
data_path = '../data'

# NOTE(review): joblib.load unpickles the file, so only point this at a
# data_dict.pkl from a trusted source.
data_dict = joblib.load(os.path.join(data_path, 'data_dict.pkl'))

In [5]:
# Per-split lookup tables: key = starting state id, value = id of the state
# that follows it. If a state id occurs more than once, the last pairing wins.
transition_dict_train = {
    state_id: next_state_id
    for state_id, next_state_id in zip(data_dict['train']['state_id'],
                                       data_dict['train']['next_state_id'])
}
transition_dict_val = {
    state_id: next_state_id
    for state_id, next_state_id in zip(data_dict['val']['state_id'],
                                       data_dict['val']['next_state_id'])
}

In [6]:
# Tuning grid: each key maps to the list of values to try for that setting.
# Only hidden_dim (4 values) and num_hidden (5 values) vary, so the grid
# expands to 4 * 5 = 20 configurations; every other key is held fixed.
param_options = dict(
    # Input width is taken from the number of columns of the training matrix.
    state_dim=[data_dict['train']['X'].shape[1]],
    action_dim=[25],
    gamma=[0.9],
    batch_size=[512],
    lr=[1e-4],
    num_epochs=[300],
    hidden_dim=[128, 256, 512, 1024],
    num_hidden=[1, 2, 3, 5, 10],
    drop_prob=[0.0],
    target_update=[10],
    option=['linear'],
    use_scheduler=[False],
)

# Iterating over config_grid yields one dict per parameter combination.
config_grid = ParameterGrid(param_options)

In [7]:
# Train all the models: one training run per configuration in `config_grid`.
# For every config the weights of the best model are written to
# ../checkpoints/<exp_name>/<config_str>.chk and the performance table (joined
# with the config values) to ../performance/<exp_name>/performance_<config_str>.csv.
# NOTE(review): RL_Dataset, dueling_net, train_model_double, dict_to_df, optim,
# lr_scheduler, nn and time are not imported by name in this notebook; they
# presumably come in through `from util import *` -- confirm.

# Create the Datasets once: none of their inputs depend on the config.
train_dataset = RL_Dataset(data_dict['train']['X'],
                           data_dict['train']['action'],
                           data_dict['train']['reward'],
                           transition_dict_train)

val_dataset = RL_Dataset(data_dict['val']['X'],
                         data_dict['val']['action'],
                         data_dict['val']['reward'],
                         transition_dict_val)

dset_sizes = {'train' : len(train_dataset),
              'val' : len(val_dataset)
             }

# Create the output folders up front so that a missing directory cannot make
# torch.save / to_csv fail after a full training run has already finished.
checkpoints_dir = '../checkpoints/' + exp_name
performance_dir = '../performance/' + exp_name
for out_dir in (checkpoints_dir, performance_dir):
    if not os.path.isdir(out_dir):
        os.makedirs(out_dir)


def weights_init(m):
    """Xavier-uniform initialise, in place, the weight of an nn.Linear module.

    Intended to be passed to `Module.apply`, which calls it on every
    sub-module; modules that are not nn.Linear are left untouched.
    """
    if isinstance(m, nn.Linear):
        # NOTE(review): newer PyTorch releases spell this `xavier_uniform_`;
        # the original name is kept so the notebook's environment still runs.
        nn.init.xavier_uniform(m.weight.data)


for config in config_grid:

    # Create the dataloaders (the batch size comes from the config)
    train_loader = DataLoader(train_dataset,
                              config['batch_size'],
                              shuffle = True,
                              num_workers = 32
                             )

    val_loader = DataLoader(val_dataset,
                            config['batch_size'],
                            shuffle = True,
                            num_workers = 32
                           )

    loaders = {'train' : train_loader,
               'val' : val_loader
              }

    print(config)

    # The online and the target network share one architecture, so build both
    # from the same keyword arguments.
    net_kwargs = dict(D_in = config['state_dim'],
                      H = config['hidden_dim'],
                      D_out = config['action_dim'],
                      drop_prob = config['drop_prob'],
                      num_hidden = config['num_hidden'],
                      option = config['option'])
    model = dueling_net(**net_kwargs)
    target_model = dueling_net(**net_kwargs)

    # Only the online model's parameters are handed to the optimizer.
    optimizer = optim.Adam([{'params': model.parameters()}],
                           lr = config['lr'])

    if config['use_scheduler']:
        scheduler = lr_scheduler.ReduceLROnPlateau(optimizer, mode = 'min', verbose = True)
    else:
        scheduler = None

    model.apply(weights_init)
    target_model.apply(weights_init)

    if use_gpu:
        model = model.cuda()
        target_model = target_model.cuda()

    criterion = torch.nn.SmoothL1Loss(size_average = False)

    performance_dict, best_model, best_loss, time_elapsed = train_model_double(model = model,
                                                                                target_model = target_model,
                                                                                loaders = loaders,
                                                                                dset_sizes = dset_sizes,
                                                                                config = config,
                                                                                criterion = criterion,
                                                                                optimizer = optimizer,
                                                                                scheduler = scheduler,
                                                                                use_gpu = use_gpu)

    # Run identifier: every key_value pair joined by '_' (join puts a separator
    # between all pairs, including the first two) in sorted key order so the
    # name does not depend on dict iteration order, followed by the
    # fractional-second digits of the current time as a suffix.
    config_items = sorted(config.items())
    config_str = '_'.join(str(key) + '_' + str(value) for key, value in config_items)
    config_str += '_time_' + str(time.time()).split('.')[1]

    checkpoints_path = os.path.join(checkpoints_dir, config_str + '.chk')
    torch.save(best_model.state_dict(), checkpoints_path)

    # Attach the config values to the performance table by joining both frames
    # on the shared config_str index, then persist the result.
    performance_df = dict_to_df(performance_dict)
    config_df = pd.DataFrame(config, index = [0])
    config_df['config_str'] = config_str
    performance_df['config_str'] = config_str
    performance_df = performance_df.set_index('config_str').join(config_df.set_index('config_str'))
    performance_df.to_csv(os.path.join(performance_dir, 'performance_' + config_str + '.csv'), index = True)

{'num_hidden': 1, 'target_update': 10, 'option': 'linear', 'drop_prob': 0.0, 'state_dim': 46, 'use_scheduler': False, 'batch_size': 512, 'lr': 0.0001, 'hidden_dim': 128, 'num_epochs': 300, 'gamma': 0.9, 'action_dim': 25}
----------
Epoch 0/299
----------
Updating Target Model
train Loss: 1.494470, Best Value: 1.170697, Empirical Value: 0.128475
val Loss: 1.647179, Best Value: 1.163967, Empirical Value: 0.206467
Best Value updated
----------
Epoch 1/299
----------
train Loss: 1.372761, Best Value: 1.531943, Empirical Value: 0.821209
val Loss: 1.269305, Best Value: 1.650092, Empirical Value: 1.058347
Best Value updated
----------
Epoch 2/299
----------
train Loss: 1.296321, Best Value: 1.653908, Empirical Value: 1.077189
val Loss: 1.262995, Best Value: 1.628762, Empirical Value: 1.072010
----------
Epoch 3/299
----------
train Loss: 1.293526, Best Value: 1.614934, Empirical Value: 1.072405
val Loss: 1.261844, Best Value: 1.590778, Empirical Value: 1.061712
----------
Epoch 4/299
--------

train Loss: 1.198855, Best Value: 2.087402, Empirical Value: 1.836700
val Loss: 1.173769, Best Value: 2.123041, Empirical Value: 1.868088
Best Value updated
----------
Epoch 45/299
----------
train Loss: 1.198677, Best Value: 2.090237, Empirical Value: 1.837201
val Loss: 1.172456, Best Value: 2.085285, Empirical Value: 1.830157
----------
Epoch 46/299
----------
train Loss: 1.198579, Best Value: 2.090169, Empirical Value: 1.836372
val Loss: 1.172303, Best Value: 2.087485, Empirical Value: 1.836897
----------
Epoch 47/299
----------
train Loss: 1.198586, Best Value: 2.092585, Empirical Value: 1.835814
val Loss: 1.172307, Best Value: 2.090358, Empirical Value: 1.836995
----------
Epoch 48/299
----------
train Loss: 1.198635, Best Value: 2.092160, Empirical Value: 1.835385
val Loss: 1.172849, Best Value: 2.075443, Empirical Value: 1.823377
----------
Epoch 49/299
----------
train Loss: 1.198500, Best Value: 2.092285, Empirical Value: 1.834775
val Loss: 1.172319, Best Value: 2.093178, Empi

val Loss: 1.136830, Best Value: 2.496461, Empirical Value: 2.248963
----------
Epoch 90/299
----------
Updating Target Model
train Loss: 1.162360, Best Value: 2.501523, Empirical Value: 2.251131
val Loss: 1.134381, Best Value: 2.480602, Empirical Value: 2.244254
----------
Epoch 91/299
----------
train Loss: 1.158946, Best Value: 2.536925, Empirical Value: 2.293152
val Loss: 1.133197, Best Value: 2.551185, Empirical Value: 2.303364
Best Value updated
----------
Epoch 92/299
----------
train Loss: 1.158725, Best Value: 2.540147, Empirical Value: 2.293577
val Loss: 1.132972, Best Value: 2.540076, Empirical Value: 2.291936
----------
Epoch 93/299
----------
train Loss: 1.158364, Best Value: 2.543897, Empirical Value: 2.295058
val Loss: 1.132935, Best Value: 2.525617, Empirical Value: 2.273232
----------
Epoch 94/299
----------
train Loss: 1.158210, Best Value: 2.544028, Empirical Value: 2.294110
val Loss: 1.132959, Best Value: 2.528722, Empirical Value: 2.276877
----------
Epoch 95/299
--

train Loss: 1.140646, Best Value: 2.762455, Empirical Value: 2.508026
val Loss: 1.115846, Best Value: 2.750766, Empirical Value: 2.492542
----------
Epoch 136/299
----------
train Loss: 1.140705, Best Value: 2.764373, Empirical Value: 2.508018
val Loss: 1.115649, Best Value: 2.758442, Empirical Value: 2.495822
----------
Epoch 137/299
----------
train Loss: 1.140613, Best Value: 2.763803, Empirical Value: 2.508035
val Loss: 1.115564, Best Value: 2.770609, Empirical Value: 2.511970
----------
Epoch 138/299
----------
train Loss: 1.140533, Best Value: 2.763418, Empirical Value: 2.507538
val Loss: 1.115481, Best Value: 2.749240, Empirical Value: 2.490921
----------
Epoch 139/299
----------
train Loss: 1.140557, Best Value: 2.765328, Empirical Value: 2.508432
val Loss: 1.115840, Best Value: 2.754930, Empirical Value: 2.496724
----------
Epoch 140/299
----------
Updating Target Model
train Loss: 1.140513, Best Value: 2.763784, Empirical Value: 2.507504
val Loss: 1.113897, Best Value: 2.7667

val Loss: 1.101660, Best Value: 2.958008, Empirical Value: 2.690761
----------
Epoch 181/299
----------
train Loss: 1.125122, Best Value: 2.998584, Empirical Value: 2.739537
val Loss: 1.100184, Best Value: 3.012910, Empirical Value: 2.751223
Best Value updated
----------
Epoch 182/299
----------
train Loss: 1.124913, Best Value: 3.002277, Empirical Value: 2.740789
val Loss: 1.113884, Best Value: 3.060300, Empirical Value: 2.800910
Best Value updated
----------
Epoch 183/299
----------
train Loss: 1.124873, Best Value: 3.003879, Empirical Value: 2.739116
val Loss: 1.100226, Best Value: 3.000764, Empirical Value: 2.733714
----------
Epoch 184/299
----------
train Loss: 1.124902, Best Value: 3.006821, Empirical Value: 2.740510
val Loss: 1.100058, Best Value: 2.998958, Empirical Value: 2.730454
----------
Epoch 185/299
----------
train Loss: 1.124809, Best Value: 3.008462, Empirical Value: 2.740647
val Loss: 1.100109, Best Value: 2.995203, Empirical Value: 2.722014
----------
Epoch 186/299

train Loss: 1.116498, Best Value: 3.176894, Empirical Value: 2.892075
val Loss: 1.092091, Best Value: 3.186754, Empirical Value: 2.896736
----------
Epoch 227/299
----------
train Loss: 1.116493, Best Value: 3.181707, Empirical Value: 2.893072
val Loss: 1.102589, Best Value: 3.222691, Empirical Value: 2.942216
Best Value updated
----------
Epoch 228/299
----------
train Loss: 1.116044, Best Value: 3.183551, Empirical Value: 2.893081
val Loss: 1.116382, Best Value: 3.253771, Empirical Value: 2.959702
Best Value updated
----------
Epoch 229/299
----------
train Loss: 1.116395, Best Value: 3.183642, Empirical Value: 2.892112
val Loss: 1.092356, Best Value: 3.173158, Empirical Value: 2.884297
----------
Epoch 230/299
----------
Updating Target Model
train Loss: 1.116456, Best Value: 3.183557, Empirical Value: 2.892580
val Loss: 1.092023, Best Value: 3.175390, Empirical Value: 2.880006
----------
Epoch 231/299
----------
train Loss: 1.114719, Best Value: 3.215061, Empirical Value: 2.932277


val Loss: 1.081838, Best Value: 3.425985, Empirical Value: 3.127987
Best Value updated
----------
Epoch 272/299
----------
train Loss: 1.105555, Best Value: 3.419695, Empirical Value: 3.121263
val Loss: 1.081975, Best Value: 3.444767, Empirical Value: 3.138746
Best Value updated
----------
Epoch 273/299
----------
train Loss: 1.105599, Best Value: 3.419046, Empirical Value: 3.120439
val Loss: 1.081664, Best Value: 3.431578, Empirical Value: 3.123007
----------
Epoch 274/299
----------
train Loss: 1.105404, Best Value: 3.422264, Empirical Value: 3.120433
val Loss: 1.081531, Best Value: 3.436569, Empirical Value: 3.135258
----------
Epoch 275/299
----------
train Loss: 1.105524, Best Value: 3.424865, Empirical Value: 3.120658
val Loss: 1.081718, Best Value: 3.433952, Empirical Value: 3.126065
----------
Epoch 276/299
----------
train Loss: 1.105429, Best Value: 3.425907, Empirical Value: 3.120098
val Loss: 1.081697, Best Value: 3.439747, Empirical Value: 3.128764
----------
Epoch 277/299

train Loss: 1.231340, Best Value: 1.753097, Empirical Value: 1.278506
val Loss: 1.202904, Best Value: 1.766956, Empirical Value: 1.278059
----------
Epoch 16/299
----------
train Loss: 1.231062, Best Value: 1.755842, Empirical Value: 1.275538
val Loss: 1.202879, Best Value: 1.771515, Empirical Value: 1.278487
----------
Epoch 17/299
----------
train Loss: 1.230833, Best Value: 1.758313, Empirical Value: 1.274050
val Loss: 1.202991, Best Value: 1.744782, Empirical Value: 1.259587
----------
Epoch 18/299
----------
train Loss: 1.230689, Best Value: 1.761189, Empirical Value: 1.272881
val Loss: 1.202504, Best Value: 1.788879, Empirical Value: 1.287135
Best Value updated
----------
Epoch 19/299
----------
train Loss: 1.230703, Best Value: 1.760333, Empirical Value: 1.268107
val Loss: 1.202877, Best Value: 1.751399, Empirical Value: 1.263141
----------
Epoch 20/299
----------
Updating Target Model
train Loss: 1.230606, Best Value: 1.761258, Empirical Value: 1.267601
val Loss: 1.281907, Best

Updating Target Model
train Loss: 1.154158, Best Value: 2.569743, Empirical Value: 2.253019
val Loss: 1.131666, Best Value: 2.568544, Empirical Value: 2.244202
----------
Epoch 61/299
----------
train Loss: 1.146590, Best Value: 2.652685, Empirical Value: 2.365715
val Loss: 1.120478, Best Value: 2.637191, Empirical Value: 2.352782
Best Value updated
----------
Epoch 62/299
----------
train Loss: 1.145322, Best Value: 2.664987, Empirical Value: 2.373878
val Loss: 1.118839, Best Value: 2.661618, Empirical Value: 2.374313
Best Value updated
----------
Epoch 63/299
----------
train Loss: 1.145203, Best Value: 2.668926, Empirical Value: 2.373260
val Loss: 1.120175, Best Value: 2.636384, Empirical Value: 2.346659
----------
Epoch 64/299
----------
train Loss: 1.145188, Best Value: 2.671049, Empirical Value: 2.372862
val Loss: 1.119192, Best Value: 2.667138, Empirical Value: 2.370727
Best Value updated
----------
Epoch 65/299
----------
train Loss: 1.144868, Best Value: 2.676099, Empirical Va

train Loss: 1.123963, Best Value: 3.103751, Empirical Value: 2.768688
val Loss: 1.100534, Best Value: 3.089034, Empirical Value: 2.754112
----------
Epoch 106/299
----------
train Loss: 1.123624, Best Value: 3.108499, Empirical Value: 2.767637
val Loss: 1.100168, Best Value: 3.089201, Empirical Value: 2.754241
----------
Epoch 107/299
----------
train Loss: 1.123730, Best Value: 3.110659, Empirical Value: 2.767819
val Loss: 1.100836, Best Value: 3.104348, Empirical Value: 2.761937
----------
Epoch 108/299
----------
train Loss: 1.123462, Best Value: 3.114262, Empirical Value: 2.767799
val Loss: 1.100715, Best Value: 3.098712, Empirical Value: 2.741664
----------
Epoch 109/299
----------
train Loss: 1.123551, Best Value: 3.117603, Empirical Value: 2.766920
val Loss: 1.108535, Best Value: 3.085389, Empirical Value: 2.735245
----------
Epoch 110/299
----------
Updating Target Model
train Loss: 1.123552, Best Value: 3.120530, Empirical Value: 2.767559
val Loss: 1.102038, Best Value: 3.1504

Updating Target Model
train Loss: 1.103763, Best Value: 3.537551, Empirical Value: 3.142644
val Loss: 1.088233, Best Value: 3.524268, Empirical Value: 3.139519
----------
Epoch 151/299
----------
train Loss: 1.101950, Best Value: 3.593975, Empirical Value: 3.228992
val Loss: 1.080909, Best Value: 3.615079, Empirical Value: 3.246963
Best Value updated
----------
Epoch 152/299
----------
train Loss: 1.101669, Best Value: 3.603860, Empirical Value: 3.232611
val Loss: 1.081743, Best Value: 3.613911, Empirical Value: 3.245415
----------
Epoch 153/299
----------
train Loss: 1.101314, Best Value: 3.607758, Empirical Value: 3.232800
val Loss: 1.081517, Best Value: 3.616844, Empirical Value: 3.239915
Best Value updated
----------
Epoch 154/299
----------
train Loss: 1.101103, Best Value: 3.612867, Empirical Value: 3.232054
val Loss: 1.081138, Best Value: 3.608843, Empirical Value: 3.225558
----------
Epoch 155/299
----------
train Loss: 1.100887, Best Value: 3.615551, Empirical Value: 3.233013


val Loss: 1.072391, Best Value: 3.984168, Empirical Value: 3.595435
----------
Epoch 195/299
----------
train Loss: 1.088132, Best Value: 4.025867, Empirical Value: 3.625403
val Loss: 1.071232, Best Value: 4.010815, Empirical Value: 3.617127
----------
Epoch 196/299
----------
train Loss: 1.088370, Best Value: 4.030134, Empirical Value: 3.625120
val Loss: 1.071660, Best Value: 4.078254, Empirical Value: 3.673527
Best Value updated
----------
Epoch 197/299
----------
train Loss: 1.088412, Best Value: 4.032626, Empirical Value: 3.625751
val Loss: 1.071460, Best Value: 4.018975, Empirical Value: 3.617357
----------
Epoch 198/299
----------
train Loss: 1.088041, Best Value: 4.038071, Empirical Value: 3.627475
val Loss: 1.073475, Best Value: 4.098142, Empirical Value: 3.692506
Best Value updated
----------
Epoch 199/299
----------
train Loss: 1.087975, Best Value: 4.037656, Empirical Value: 3.624781
val Loss: 1.071453, Best Value: 4.066490, Empirical Value: 3.657018
----------
Epoch 200/299

Updating Target Model
train Loss: 1.075294, Best Value: 4.331589, Empirical Value: 3.902579
val Loss: 1.059293, Best Value: 4.280814, Empirical Value: 3.877890
----------
Epoch 241/299
----------
train Loss: 1.072796, Best Value: 4.346513, Empirical Value: 3.916831
val Loss: 1.058469, Best Value: 4.362636, Empirical Value: 3.921473
----------
Epoch 242/299
----------
train Loss: 1.072104, Best Value: 4.348426, Empirical Value: 3.913674
val Loss: 1.059160, Best Value: 4.297232, Empirical Value: 3.877039
----------
Epoch 243/299
----------
train Loss: 1.071913, Best Value: 4.348266, Empirical Value: 3.915566
val Loss: 1.059053, Best Value: 4.340666, Empirical Value: 3.907239
----------
Epoch 244/299
----------
train Loss: 1.072135, Best Value: 4.353174, Empirical Value: 3.914987
val Loss: 1.058755, Best Value: 4.355463, Empirical Value: 3.918855
----------
Epoch 245/299
----------
train Loss: 1.071775, Best Value: 4.351946, Empirical Value: 3.914275
val Loss: 1.057878, Best Value: 4.3448

train Loss: 1.066147, Best Value: 4.680902, Empirical Value: 4.232599
val Loss: 1.057484, Best Value: 4.661537, Empirical Value: 4.207907
----------
Epoch 286/299
----------
train Loss: 1.066873, Best Value: 4.684719, Empirical Value: 4.232112
val Loss: 1.056545, Best Value: 4.726524, Empirical Value: 4.281911
Best Value updated
----------
Epoch 287/299
----------
train Loss: 1.066223, Best Value: 4.688624, Empirical Value: 4.231104
val Loss: 1.058062, Best Value: 4.624448, Empirical Value: 4.179692
----------
Epoch 288/299
----------
train Loss: 1.066090, Best Value: 4.692469, Empirical Value: 4.234464
val Loss: 1.055547, Best Value: 4.669386, Empirical Value: 4.205156
----------
Epoch 289/299
----------
train Loss: 1.065651, Best Value: 4.692944, Empirical Value: 4.229624
val Loss: 1.056991, Best Value: 4.636139, Empirical Value: 4.184259
----------
Epoch 290/299
----------
Updating Target Model
train Loss: 1.066369, Best Value: 4.698278, Empirical Value: 4.233162
val Loss: 1.059808,

train Loss: 1.231763, Best Value: 1.688851, Empirical Value: 1.313134
val Loss: 1.205735, Best Value: 1.676417, Empirical Value: 1.296186
----------
Epoch 30/299
----------
Updating Target Model
train Loss: 1.231898, Best Value: 1.690629, Empirical Value: 1.310042
val Loss: 1.231989, Best Value: 1.707299, Empirical Value: 1.329212
----------
Epoch 31/299
----------
train Loss: 1.216764, Best Value: 1.880675, Empirical Value: 1.568104
val Loss: 1.188069, Best Value: 1.916257, Empirical Value: 1.592697
Best Value updated
----------
Epoch 32/299
----------
train Loss: 1.213972, Best Value: 1.896126, Empirical Value: 1.578533
val Loss: 1.187886, Best Value: 1.957761, Empirical Value: 1.618075
Best Value updated
----------
Epoch 33/299
----------
train Loss: 1.214092, Best Value: 1.898290, Empirical Value: 1.575992
val Loss: 1.187676, Best Value: 1.905567, Empirical Value: 1.576581
----------
Epoch 34/299
----------
train Loss: 1.214004, Best Value: 1.900807, Empirical Value: 1.575689
val L

train Loss: 1.163418, Best Value: 2.453626, Empirical Value: 2.165674
val Loss: 1.140276, Best Value: 2.492359, Empirical Value: 2.204062
----------
Epoch 75/299
----------
train Loss: 1.163249, Best Value: 2.454795, Empirical Value: 2.164794
val Loss: 1.140164, Best Value: 2.489082, Empirical Value: 2.194427
----------
Epoch 76/299
----------
train Loss: 1.163283, Best Value: 2.455398, Empirical Value: 2.164400
val Loss: 1.141111, Best Value: 2.503612, Empirical Value: 2.210603
Best Value updated
----------
Epoch 77/299
----------
train Loss: 1.163015, Best Value: 2.459308, Empirical Value: 2.163890
val Loss: 1.140928, Best Value: 2.472547, Empirical Value: 2.177517
----------
Epoch 78/299
----------
train Loss: 1.163166, Best Value: 2.459615, Empirical Value: 2.163497
val Loss: 1.140366, Best Value: 2.484351, Empirical Value: 2.188399
----------
Epoch 79/299
----------
train Loss: 1.162798, Best Value: 2.461320, Empirical Value: 2.162677
val Loss: 1.140492, Best Value: 2.494472, Empi

train Loss: 1.128837, Best Value: 2.908552, Empirical Value: 2.586909
val Loss: 1.113082, Best Value: 2.889189, Empirical Value: 2.561368
----------
Epoch 120/299
----------
Updating Target Model
train Loss: 1.128567, Best Value: 2.909999, Empirical Value: 2.587661
val Loss: 1.112437, Best Value: 2.909709, Empirical Value: 2.589137
----------
Epoch 121/299
----------
train Loss: 1.124598, Best Value: 2.984919, Empirical Value: 2.676919
val Loss: 1.107512, Best Value: 2.999922, Empirical Value: 2.694081
Best Value updated
----------
Epoch 122/299
----------
train Loss: 1.124128, Best Value: 2.995997, Empirical Value: 2.681994
val Loss: 1.123221, Best Value: 2.914764, Empirical Value: 2.618427
----------
Epoch 123/299
----------
train Loss: 1.124167, Best Value: 2.997059, Empirical Value: 2.680184
val Loss: 1.106971, Best Value: 3.018583, Empirical Value: 2.704852
Best Value updated
----------
Epoch 124/299
----------
train Loss: 1.123839, Best Value: 3.004176, Empirical Value: 2.679900


train Loss: 1.097860, Best Value: 3.485821, Empirical Value: 3.114964
val Loss: 1.086174, Best Value: 3.458202, Empirical Value: 3.098657
----------
Epoch 165/299
----------
train Loss: 1.097718, Best Value: 3.490776, Empirical Value: 3.116710
val Loss: 1.085483, Best Value: 3.495410, Empirical Value: 3.126172
----------
Epoch 166/299
----------
train Loss: 1.097239, Best Value: 3.497002, Empirical Value: 3.117854
val Loss: 1.085389, Best Value: 3.507584, Empirical Value: 3.134629
----------
Epoch 167/299
----------
train Loss: 1.097271, Best Value: 3.492878, Empirical Value: 3.114386
val Loss: 1.085784, Best Value: 3.472063, Empirical Value: 3.090228
----------
Epoch 168/299
----------
train Loss: 1.096794, Best Value: 3.498857, Empirical Value: 3.115870
val Loss: 1.084662, Best Value: 3.500806, Empirical Value: 3.123291
----------
Epoch 169/299
----------
train Loss: 1.097070, Best Value: 3.504270, Empirical Value: 3.115773
val Loss: 1.085122, Best Value: 3.507067, Empirical Value: 3

train Loss: 1.074666, Best Value: 4.014588, Empirical Value: 3.571771
val Loss: 1.067590, Best Value: 4.007867, Empirical Value: 3.567311
----------
Epoch 210/299
----------
Updating Target Model
train Loss: 1.074811, Best Value: 4.017180, Empirical Value: 3.572474
val Loss: 1.073072, Best Value: 4.013110, Empirical Value: 3.557404
----------
Epoch 211/299
----------
train Loss: 1.074904, Best Value: 4.107825, Empirical Value: 3.675793
val Loss: 1.067239, Best Value: 4.121885, Empirical Value: 3.694499
Best Value updated
----------
Epoch 212/299
----------
train Loss: 1.073078, Best Value: 4.125336, Empirical Value: 3.684759
val Loss: 1.066013, Best Value: 4.134707, Empirical Value: 3.701154
Best Value updated
----------
Epoch 213/299
----------
train Loss: 1.072940, Best Value: 4.125544, Empirical Value: 3.684121
val Loss: 1.067799, Best Value: 4.078975, Empirical Value: 3.630963
----------
Epoch 214/299
----------
train Loss: 1.072308, Best Value: 4.130594, Empirical Value: 3.682088


train Loss: 1.048026, Best Value: 4.722257, Empirical Value: 4.241431
val Loss: 1.046501, Best Value: 4.688329, Empirical Value: 4.213081
----------
Epoch 255/299
----------
train Loss: 1.047934, Best Value: 4.729955, Empirical Value: 4.244204
val Loss: 1.047007, Best Value: 4.717101, Empirical Value: 4.228882
----------
Epoch 256/299
----------
train Loss: 1.046888, Best Value: 4.733581, Empirical Value: 4.242419
val Loss: 1.054641, Best Value: 4.727428, Empirical Value: 4.233533
----------
Epoch 257/299
----------
train Loss: 1.046982, Best Value: 4.736947, Empirical Value: 4.243620
val Loss: 1.044138, Best Value: 4.726011, Empirical Value: 4.232998
----------
Epoch 258/299
----------
train Loss: 1.046723, Best Value: 4.738147, Empirical Value: 4.243971
val Loss: 1.045458, Best Value: 4.711211, Empirical Value: 4.211378
----------
Epoch 259/299
----------
train Loss: 1.046745, Best Value: 4.739673, Empirical Value: 4.240440
val Loss: 1.047243, Best Value: 4.711666, Empirical Value: 4

train Loss: 1.025429, Best Value: 5.183161, Empirical Value: 4.641358
val Loss: 1.027481, Best Value: 5.187251, Empirical Value: 4.646929
Training complete in 18m 30s
Best value: 5.205771
{'num_hidden': 5, 'target_update': 10, 'option': 'linear', 'drop_prob': 0.0, 'state_dim': 46, 'use_scheduler': False, 'batch_size': 512, 'lr': 0.0001, 'hidden_dim': 128, 'num_epochs': 300, 'gamma': 0.9, 'action_dim': 25}
----------
Epoch 0/299
----------
Updating Target Model
train Loss: 1.341565, Best Value: 1.024567, Empirical Value: 0.042337
val Loss: 1.585362, Best Value: 0.886760, Empirical Value: 0.012828
Best Value updated
----------
Epoch 1/299
----------
train Loss: 1.328581, Best Value: 1.194322, Empirical Value: 0.599749
val Loss: 1.252005, Best Value: 1.297951, Empirical Value: 0.758361
Best Value updated
----------
Epoch 2/299
----------
train Loss: 1.281754, Best Value: 1.252691, Empirical Value: 0.762496
val Loss: 1.251174, Best Value: 1.246335, Empirical Value: 0.758817
----------
Epoc

train Loss: 1.187554, Best Value: 2.150998, Empirical Value: 1.855893
val Loss: 1.164510, Best Value: 2.150296, Empirical Value: 1.858070
----------
Epoch 44/299
----------
train Loss: 1.187114, Best Value: 2.155737, Empirical Value: 1.856634
val Loss: 1.163793, Best Value: 2.133126, Empirical Value: 1.839041
----------
Epoch 45/299
----------
train Loss: 1.186885, Best Value: 2.158963, Empirical Value: 1.853827
val Loss: 1.164943, Best Value: 2.133005, Empirical Value: 1.830149
----------
Epoch 46/299
----------
train Loss: 1.186934, Best Value: 2.160042, Empirical Value: 1.851647
val Loss: 1.164052, Best Value: 2.143382, Empirical Value: 1.839739
----------
Epoch 47/299
----------
train Loss: 1.186618, Best Value: 2.162063, Empirical Value: 1.852219
val Loss: 1.165352, Best Value: 2.163829, Empirical Value: 1.846941
----------
Epoch 48/299
----------
train Loss: 1.186454, Best Value: 2.163460, Empirical Value: 1.848477
val Loss: 1.165514, Best Value: 2.186908, Empirical Value: 1.8733

train Loss: 1.147457, Best Value: 2.715303, Empirical Value: 2.379246
val Loss: 1.135879, Best Value: 2.738250, Empirical Value: 2.417496
----------
Epoch 90/299
----------
Updating Target Model
train Loss: 1.147012, Best Value: 2.719022, Empirical Value: 2.380133
val Loss: 1.139005, Best Value: 2.737905, Empirical Value: 2.410332
----------
Epoch 91/299
----------
train Loss: 1.141488, Best Value: 2.839513, Empirical Value: 2.525783
val Loss: 1.130131, Best Value: 2.887233, Empirical Value: 2.572929
Best Value updated
----------
Epoch 92/299
----------
train Loss: 1.140080, Best Value: 2.854576, Empirical Value: 2.535542
val Loss: 1.129803, Best Value: 2.831661, Empirical Value: 2.512773
----------
Epoch 93/299
----------
train Loss: 1.139301, Best Value: 2.863903, Empirical Value: 2.534940
val Loss: 1.131173, Best Value: 2.868622, Empirical Value: 2.541588
----------
Epoch 94/299
----------
train Loss: 1.139221, Best Value: 2.867080, Empirical Value: 2.535785
val Loss: 1.129848, Best

train Loss: 1.122775, Best Value: 3.253814, Empirical Value: 2.860772
val Loss: 1.127107, Best Value: 3.249738, Empirical Value: 2.877232
Best Value updated
----------
Epoch 136/299
----------
train Loss: 1.122419, Best Value: 3.255522, Empirical Value: 2.862020
val Loss: 1.123746, Best Value: 3.210844, Empirical Value: 2.825773
----------
Epoch 137/299
----------
train Loss: 1.121944, Best Value: 3.258481, Empirical Value: 2.862059
val Loss: 1.125332, Best Value: 3.212962, Empirical Value: 2.829147
----------
Epoch 138/299
----------
train Loss: 1.120941, Best Value: 3.258303, Empirical Value: 2.863173
val Loss: 1.122854, Best Value: 3.221207, Empirical Value: 2.829427
----------
Epoch 139/299
----------
train Loss: 1.121727, Best Value: 3.258288, Empirical Value: 2.858707
val Loss: 1.124493, Best Value: 3.229889, Empirical Value: 2.838446
----------
Epoch 140/299
----------
Updating Target Model
train Loss: 1.121627, Best Value: 3.266351, Empirical Value: 2.862996
val Loss: 1.129718,

Updating Target Model
train Loss: 1.107772, Best Value: 3.896549, Empirical Value: 3.449372
val Loss: 1.123840, Best Value: 3.851041, Empirical Value: 3.420068
----------
Epoch 181/299
----------
train Loss: 1.107396, Best Value: 3.993173, Empirical Value: 3.575272
val Loss: 1.114501, Best Value: 3.950794, Empirical Value: 3.540578
Best Value updated
----------
Epoch 182/299
----------
train Loss: 1.105978, Best Value: 4.005657, Empirical Value: 3.582408
val Loss: 1.113689, Best Value: 3.952079, Empirical Value: 3.543792
Best Value updated
----------
Epoch 183/299
----------
train Loss: 1.105969, Best Value: 4.012545, Empirical Value: 3.580605
val Loss: 1.113083, Best Value: 3.968183, Empirical Value: 3.541627
Best Value updated
----------
Epoch 184/299
----------
train Loss: 1.103689, Best Value: 4.022944, Empirical Value: 3.582377
val Loss: 1.114027, Best Value: 3.988801, Empirical Value: 3.569853
Best Value updated
----------
Epoch 185/299
----------
train Loss: 1.104311, Best Value

val Loss: 1.083203, Best Value: 4.510792, Empirical Value: 4.041732
----------
Epoch 225/299
----------
train Loss: 1.066206, Best Value: 4.554787, Empirical Value: 4.069936
val Loss: 1.100907, Best Value: 4.518688, Empirical Value: 4.046737
----------
Epoch 226/299
----------
train Loss: 1.065032, Best Value: 4.556139, Empirical Value: 4.068275
val Loss: 1.082713, Best Value: 4.524797, Empirical Value: 4.054225
----------
Epoch 227/299
----------
train Loss: 1.065437, Best Value: 4.558727, Empirical Value: 4.070409
val Loss: 1.082111, Best Value: 4.534982, Empirical Value: 4.056420
----------
Epoch 228/299
----------
train Loss: 1.064362, Best Value: 4.559956, Empirical Value: 4.066872
val Loss: 1.085565, Best Value: 4.481126, Empirical Value: 4.011953
----------
Epoch 229/299
----------
train Loss: 1.065192, Best Value: 4.560359, Empirical Value: 4.069131
val Loss: 1.085411, Best Value: 4.575363, Empirical Value: 4.098310
Best Value updated
----------
Epoch 230/299
----------
Updatin

Updating Target Model
train Loss: 1.040211, Best Value: 4.988540, Empirical Value: 4.477197
val Loss: 1.059952, Best Value: 4.939667, Empirical Value: 4.449133
----------
Epoch 271/299
----------
train Loss: 1.034833, Best Value: 5.053417, Empirical Value: 4.562299
val Loss: 1.063766, Best Value: 5.036741, Empirical Value: 4.563025
Best Value updated
----------
Epoch 272/299
----------
train Loss: 1.033834, Best Value: 5.069071, Empirical Value: 4.569640
val Loss: 1.062660, Best Value: 5.034032, Empirical Value: 4.553275
----------
Epoch 273/299
----------
train Loss: 1.032404, Best Value: 5.070651, Empirical Value: 4.570302
val Loss: 1.062491, Best Value: 4.972985, Empirical Value: 4.491589
----------
Epoch 274/299
----------
train Loss: 1.033868, Best Value: 5.074909, Empirical Value: 4.567845
val Loss: 1.061859, Best Value: 5.018595, Empirical Value: 4.534949
----------
Epoch 275/299
----------
train Loss: 1.032630, Best Value: 5.078282, Empirical Value: 4.568435
val Loss: 1.066006,

train Loss: 1.237675, Best Value: 1.621145, Empirical Value: 1.153379
val Loss: 1.212620, Best Value: 1.571335, Empirical Value: 1.122518
Best Value updated
----------
Epoch 15/299
----------
train Loss: 1.237332, Best Value: 1.625941, Empirical Value: 1.152332
val Loss: 1.212319, Best Value: 1.588508, Empirical Value: 1.128151
Best Value updated
----------
Epoch 16/299
----------
train Loss: 1.236959, Best Value: 1.628818, Empirical Value: 1.150188
val Loss: 1.215044, Best Value: 1.601852, Empirical Value: 1.132195
Best Value updated
----------
Epoch 17/299
----------
train Loss: 1.236390, Best Value: 1.634060, Empirical Value: 1.149008
val Loss: 1.212715, Best Value: 1.624118, Empirical Value: 1.142624
Best Value updated
----------
Epoch 18/299
----------
train Loss: 1.236406, Best Value: 1.641090, Empirical Value: 1.147070
val Loss: 1.214167, Best Value: 1.603384, Empirical Value: 1.118081
----------
Epoch 19/299
----------
train Loss: 1.236185, Best Value: 1.640195, Empirical Value

train Loss: 1.184030, Best Value: 2.624206, Empirical Value: 2.256341
val Loss: 1.195591, Best Value: 2.554994, Empirical Value: 2.211313
----------
Epoch 60/299
----------
Updating Target Model
train Loss: 1.183608, Best Value: 2.621495, Empirical Value: 2.250041
val Loss: 1.198187, Best Value: 2.565731, Empirical Value: 2.211573
----------
Epoch 61/299
----------
train Loss: 1.183864, Best Value: 2.746324, Empirical Value: 2.408938
val Loss: 1.184661, Best Value: 2.714129, Empirical Value: 2.389140
Best Value updated
----------
Epoch 62/299
----------
train Loss: 1.180636, Best Value: 2.755183, Empirical Value: 2.415554
val Loss: 1.191016, Best Value: 2.719976, Empirical Value: 2.392762
Best Value updated
----------
Epoch 63/299
----------
train Loss: 1.178561, Best Value: 2.768517, Empirical Value: 2.421592
val Loss: 1.188041, Best Value: 2.657666, Empirical Value: 2.333927
----------
Epoch 64/299
----------
train Loss: 1.178899, Best Value: 2.766098, Empirical Value: 2.417912
val L

val Loss: 1.189176, Best Value: 3.212767, Empirical Value: 2.871020
----------
Epoch 105/299
----------
train Loss: 1.155315, Best Value: 3.334209, Empirical Value: 2.966615
val Loss: 1.183546, Best Value: 3.337441, Empirical Value: 2.973693
----------
Epoch 106/299
----------
train Loss: 1.157219, Best Value: 3.343562, Empirical Value: 2.968623
val Loss: 1.187034, Best Value: 3.301676, Empirical Value: 2.936746
----------
Epoch 107/299
----------
train Loss: 1.154801, Best Value: 3.341132, Empirical Value: 2.963664
val Loss: 1.185689, Best Value: 3.265534, Empirical Value: 2.907386
----------
Epoch 108/299
----------
train Loss: 1.153350, Best Value: 3.343061, Empirical Value: 2.963516
val Loss: 1.184997, Best Value: 3.314581, Empirical Value: 2.945916
----------
Epoch 109/299
----------
train Loss: 1.151972, Best Value: 3.347026, Empirical Value: 2.965250
val Loss: 1.188688, Best Value: 3.229644, Empirical Value: 2.857557
----------
Epoch 110/299
----------
Updating Target Model
trai

Updating Target Model
train Loss: 1.128107, Best Value: 3.887514, Empirical Value: 3.465469
val Loss: 1.204021, Best Value: 3.916470, Empirical Value: 3.487901
Best Value updated
----------
Epoch 151/299
----------
train Loss: 1.145508, Best Value: 4.008020, Empirical Value: 3.619835
val Loss: 1.206528, Best Value: 3.881974, Empirical Value: 3.513013
----------
Epoch 152/299
----------
train Loss: 1.141932, Best Value: 4.033609, Empirical Value: 3.638812
val Loss: 1.209796, Best Value: 3.957773, Empirical Value: 3.579192
Best Value updated
----------
Epoch 153/299
----------
train Loss: 1.139761, Best Value: 4.041264, Empirical Value: 3.642028
val Loss: 1.206367, Best Value: 3.903255, Empirical Value: 3.525080
----------
Epoch 154/299
----------
train Loss: 1.136478, Best Value: 4.048108, Empirical Value: 3.639548
val Loss: 1.207698, Best Value: 3.913799, Empirical Value: 3.533570
----------
Epoch 155/299
----------
train Loss: 1.136293, Best Value: 4.052283, Empirical Value: 3.641838


train Loss: 1.108596, Best Value: 4.431534, Empirical Value: 3.982149
val Loss: 1.206251, Best Value: 4.346415, Empirical Value: 3.914565
----------
Epoch 196/299
----------
train Loss: 1.107681, Best Value: 4.437541, Empirical Value: 3.983993
val Loss: 1.214482, Best Value: 4.305478, Empirical Value: 3.884030
----------
Epoch 197/299
----------
train Loss: 1.105747, Best Value: 4.443416, Empirical Value: 3.984493
val Loss: 1.211866, Best Value: 4.403949, Empirical Value: 3.959342
----------
Epoch 198/299
----------
train Loss: 1.105621, Best Value: 4.441583, Empirical Value: 3.981868
val Loss: 1.205235, Best Value: 4.290662, Empirical Value: 3.871355
----------
Epoch 199/299
----------
train Loss: 1.105134, Best Value: 4.447628, Empirical Value: 3.985443
val Loss: 1.207792, Best Value: 4.376289, Empirical Value: 3.929927
----------
Epoch 200/299
----------
Updating Target Model
train Loss: 1.104655, Best Value: 4.449955, Empirical Value: 3.983854
val Loss: 1.180134, Best Value: 4.3400

train Loss: 1.087024, Best Value: 4.857985, Empirical Value: 4.386741
val Loss: 1.208459, Best Value: 4.753559, Empirical Value: 4.302074
----------
Epoch 242/299
----------
train Loss: 1.083435, Best Value: 4.866782, Empirical Value: 4.389747
val Loss: 1.216738, Best Value: 4.812839, Empirical Value: 4.346916
Best Value updated
----------
Epoch 243/299
----------
train Loss: 1.084487, Best Value: 4.867855, Empirical Value: 4.390839
val Loss: 1.209217, Best Value: 4.815165, Empirical Value: 4.344483
Best Value updated
----------
Epoch 244/299
----------
train Loss: 1.078159, Best Value: 4.871400, Empirical Value: 4.387431
val Loss: 1.202053, Best Value: 4.834660, Empirical Value: 4.376428
Best Value updated
----------
Epoch 245/299
----------
train Loss: 1.079347, Best Value: 4.876104, Empirical Value: 4.390258
val Loss: 1.206596, Best Value: 4.825022, Empirical Value: 4.364012
----------
Epoch 246/299
----------
train Loss: 1.079258, Best Value: 4.876377, Empirical Value: 4.386452
val

train Loss: 1.062238, Best Value: 5.143814, Empirical Value: 4.620806
val Loss: 1.234717, Best Value: 5.056211, Empirical Value: 4.550259
----------
Epoch 288/299
----------
train Loss: 1.061105, Best Value: 5.143362, Empirical Value: 4.619851
val Loss: 1.230131, Best Value: 5.056422, Empirical Value: 4.553478
----------
Epoch 289/299
----------
train Loss: 1.061161, Best Value: 5.146916, Empirical Value: 4.616887
val Loss: 1.231718, Best Value: 4.896955, Empirical Value: 4.401934
----------
Epoch 290/299
----------
Updating Target Model
train Loss: 1.061248, Best Value: 5.149215, Empirical Value: 4.625114
val Loss: 1.206221, Best Value: 5.004630, Empirical Value: 4.485423
----------
Epoch 291/299
----------
train Loss: 1.068846, Best Value: 5.172447, Empirical Value: 4.651993
val Loss: 1.227409, Best Value: 5.090182, Empirical Value: 4.591026
----------
Epoch 292/299
----------
train Loss: 1.068833, Best Value: 5.178097, Empirical Value: 4.654834
val Loss: 1.228242, Best Value: 5.0689

train Loss: 1.213280, Best Value: 2.171677, Empirical Value: 1.833158
val Loss: 1.184010, Best Value: 2.223427, Empirical Value: 1.876812
Best Value updated
----------
Epoch 32/299
----------
train Loss: 1.210661, Best Value: 2.192409, Empirical Value: 1.843846
val Loss: 1.184371, Best Value: 2.235343, Empirical Value: 1.878983
Best Value updated
----------
Epoch 33/299
----------
train Loss: 1.209903, Best Value: 2.200608, Empirical Value: 1.844686
val Loss: 1.183724, Best Value: 2.207129, Empirical Value: 1.846846
----------
Epoch 34/299
----------
train Loss: 1.209530, Best Value: 2.205518, Empirical Value: 1.843745
val Loss: 1.182634, Best Value: 2.227433, Empirical Value: 1.862389
----------
Epoch 35/299
----------
train Loss: 1.209083, Best Value: 2.213046, Empirical Value: 1.844157
val Loss: 1.182273, Best Value: 2.254305, Empirical Value: 1.880696
Best Value updated
----------
Epoch 36/299
----------
train Loss: 1.208804, Best Value: 2.213238, Empirical Value: 1.843985
val Loss

train Loss: 1.152789, Best Value: 2.818574, Empirical Value: 2.502702
val Loss: 1.127633, Best Value: 2.847801, Empirical Value: 2.531673
----------
Epoch 77/299
----------
train Loss: 1.152793, Best Value: 2.816358, Empirical Value: 2.501161
val Loss: 1.128271, Best Value: 2.862749, Empirical Value: 2.546809
----------
Epoch 78/299
----------
train Loss: 1.152664, Best Value: 2.818345, Empirical Value: 2.502234
val Loss: 1.127969, Best Value: 2.861133, Empirical Value: 2.545995
----------
Epoch 79/299
----------
train Loss: 1.152599, Best Value: 2.820823, Empirical Value: 2.501685
val Loss: 1.127600, Best Value: 2.848099, Empirical Value: 2.527262
----------
Epoch 80/299
----------
Updating Target Model
train Loss: 1.152640, Best Value: 2.821592, Empirical Value: 2.500966
val Loss: 1.124560, Best Value: 2.859645, Empirical Value: 2.539066
----------
Epoch 81/299
----------
train Loss: 1.145351, Best Value: 2.899805, Empirical Value: 2.604664
val Loss: 1.123030, Best Value: 2.934564, E

train Loss: 1.123042, Best Value: 3.163850, Empirical Value: 2.866525
val Loss: 1.099685, Best Value: 3.207877, Empirical Value: 2.904062
Best Value updated
----------
Epoch 122/299
----------
train Loss: 1.122904, Best Value: 3.166086, Empirical Value: 2.867619
val Loss: 1.099337, Best Value: 3.196981, Empirical Value: 2.897405
----------
Epoch 123/299
----------
train Loss: 1.122891, Best Value: 3.167580, Empirical Value: 2.867809
val Loss: 1.099393, Best Value: 3.199787, Empirical Value: 2.898015
----------
Epoch 124/299
----------
train Loss: 1.122624, Best Value: 3.167986, Empirical Value: 2.866559
val Loss: 1.099197, Best Value: 3.182665, Empirical Value: 2.887469
----------
Epoch 125/299
----------
train Loss: 1.122583, Best Value: 3.170366, Empirical Value: 2.868384
val Loss: 1.100738, Best Value: 3.146403, Empirical Value: 2.852905
----------
Epoch 126/299
----------
train Loss: 1.122619, Best Value: 3.170224, Empirical Value: 2.866749
val Loss: 1.099956, Best Value: 3.219527,

train Loss: 1.110257, Best Value: 3.386180, Empirical Value: 3.068290
val Loss: 1.092037, Best Value: 3.418604, Empirical Value: 3.103544
----------
Epoch 167/299
----------
train Loss: 1.110074, Best Value: 3.388892, Empirical Value: 3.068763
val Loss: 1.087930, Best Value: 3.388751, Empirical Value: 3.066529
----------
Epoch 168/299
----------
train Loss: 1.110167, Best Value: 3.391079, Empirical Value: 3.069167
val Loss: 1.087826, Best Value: 3.437707, Empirical Value: 3.109274
----------
Epoch 169/299
----------
train Loss: 1.110210, Best Value: 3.391901, Empirical Value: 3.067689
val Loss: 1.087649, Best Value: 3.400593, Empirical Value: 3.085875
----------
Epoch 170/299
----------
Updating Target Model
train Loss: 1.110056, Best Value: 3.391768, Empirical Value: 3.068505
val Loss: 1.086837, Best Value: 3.432783, Empirical Value: 3.099852
----------
Epoch 171/299
----------
train Loss: 1.107525, Best Value: 3.439622, Empirical Value: 3.130024
val Loss: 1.084851, Best Value: 3.4739

val Loss: 1.078423, Best Value: 3.683903, Empirical Value: 3.342812
Best Value updated
----------
Epoch 212/299
----------
train Loss: 1.099600, Best Value: 3.670179, Empirical Value: 3.325000
val Loss: 1.091817, Best Value: 3.722732, Empirical Value: 3.375790
Best Value updated
----------
Epoch 213/299
----------
train Loss: 1.099478, Best Value: 3.673207, Empirical Value: 3.323756
val Loss: 1.078499, Best Value: 3.719048, Empirical Value: 3.365995
----------
Epoch 214/299
----------
train Loss: 1.099128, Best Value: 3.678636, Empirical Value: 3.325659
val Loss: 1.078980, Best Value: 3.734947, Empirical Value: 3.374458
Best Value updated
----------
Epoch 215/299
----------
train Loss: 1.099410, Best Value: 3.677777, Empirical Value: 3.323449
val Loss: 1.077906, Best Value: 3.705075, Empirical Value: 3.349119
----------
Epoch 216/299
----------
train Loss: 1.099114, Best Value: 3.679996, Empirical Value: 3.324703
val Loss: 1.078721, Best Value: 3.739484, Empirical Value: 3.374831
Best 

train Loss: 1.092637, Best Value: 3.959020, Empirical Value: 3.573136
val Loss: 1.073296, Best Value: 4.001064, Empirical Value: 3.612187
----------
Epoch 257/299
----------
train Loss: 1.092441, Best Value: 3.960276, Empirical Value: 3.572412
val Loss: 1.073482, Best Value: 4.009653, Empirical Value: 3.617984
Best Value updated
----------
Epoch 258/299
----------
train Loss: 1.092392, Best Value: 3.963028, Empirical Value: 3.572275
val Loss: 1.073576, Best Value: 3.978917, Empirical Value: 3.591900
----------
Epoch 259/299
----------
train Loss: 1.092178, Best Value: 3.966705, Empirical Value: 3.573107
val Loss: 1.075189, Best Value: 3.991390, Empirical Value: 3.603053
----------
Epoch 260/299
----------
Updating Target Model
train Loss: 1.092177, Best Value: 3.965756, Empirical Value: 3.573188
val Loss: 1.074546, Best Value: 4.018190, Empirical Value: 3.614544
Best Value updated
----------
Epoch 261/299
----------
train Loss: 1.091103, Best Value: 4.021163, Empirical Value: 3.646887


Updating Target Model
train Loss: 1.354864, Best Value: 1.091806, Empirical Value: 0.079791
val Loss: 1.594443, Best Value: 0.977888, Empirical Value: 0.087076
Best Value updated
----------
Epoch 1/299
----------
train Loss: 1.324251, Best Value: 1.367292, Empirical Value: 0.782283
val Loss: 1.261312, Best Value: 1.410005, Empirical Value: 0.888404
Best Value updated
----------
Epoch 2/299
----------
train Loss: 1.292758, Best Value: 1.377191, Empirical Value: 0.870903
val Loss: 1.261180, Best Value: 1.340990, Empirical Value: 0.841759
----------
Epoch 3/299
----------
train Loss: 1.291362, Best Value: 1.335425, Empirical Value: 0.842307
val Loss: 1.261958, Best Value: 1.317758, Empirical Value: 0.830171
----------
Epoch 4/299
----------
train Loss: 1.291224, Best Value: 1.313029, Empirical Value: 0.819023
val Loss: 1.262249, Best Value: 1.300151, Empirical Value: 0.810128
----------
Epoch 5/299
----------
train Loss: 1.291561, Best Value: 1.298891, Empirical Value: 0.799083
val Loss: 

val Loss: 1.175863, Best Value: 2.447988, Empirical Value: 2.069725
----------
Epoch 46/299
----------
train Loss: 1.195105, Best Value: 2.493520, Empirical Value: 2.096349
val Loss: 1.174686, Best Value: 2.493799, Empirical Value: 2.101015
----------
Epoch 47/299
----------
train Loss: 1.194936, Best Value: 2.494112, Empirical Value: 2.095485
val Loss: 1.174193, Best Value: 2.494189, Empirical Value: 2.103858
----------
Epoch 48/299
----------
train Loss: 1.194953, Best Value: 2.495183, Empirical Value: 2.094433
val Loss: 1.174244, Best Value: 2.485492, Empirical Value: 2.085384
----------
Epoch 49/299
----------
train Loss: 1.194772, Best Value: 2.498840, Empirical Value: 2.093053
val Loss: 1.174623, Best Value: 2.496723, Empirical Value: 2.093020
----------
Epoch 50/299
----------
Updating Target Model
train Loss: 1.194752, Best Value: 2.499598, Empirical Value: 2.092764
val Loss: 1.182263, Best Value: 2.501476, Empirical Value: 2.100820
----------
Epoch 51/299
----------
train Loss

val Loss: 1.118905, Best Value: 3.212839, Empirical Value: 2.809872
----------
Epoch 91/299
----------
train Loss: 1.122813, Best Value: 3.346310, Empirical Value: 2.965463
val Loss: 1.106316, Best Value: 3.344384, Empirical Value: 2.957060
Best Value updated
----------
Epoch 92/299
----------
train Loss: 1.122162, Best Value: 3.355425, Empirical Value: 2.967513
val Loss: 1.108366, Best Value: 3.307810, Empirical Value: 2.926752
----------
Epoch 93/299
----------
train Loss: 1.122124, Best Value: 3.365073, Empirical Value: 2.969206
val Loss: 1.106326, Best Value: 3.348910, Empirical Value: 2.951553
Best Value updated
----------
Epoch 94/299
----------
train Loss: 1.121674, Best Value: 3.367907, Empirical Value: 2.967763
val Loss: 1.106838, Best Value: 3.375332, Empirical Value: 2.974786
Best Value updated
----------
Epoch 95/299
----------
train Loss: 1.121354, Best Value: 3.373590, Empirical Value: 2.967334
val Loss: 1.106217, Best Value: 3.377437, Empirical Value: 2.978792
Best Value

train Loss: 1.087347, Best Value: 4.010723, Empirical Value: 3.563124
val Loss: 1.077356, Best Value: 4.015471, Empirical Value: 3.571357
Best Value updated
----------
Epoch 136/299
----------
train Loss: 1.087699, Best Value: 4.016721, Empirical Value: 3.561581
val Loss: 1.077808, Best Value: 3.987645, Empirical Value: 3.549031
----------
Epoch 137/299
----------
train Loss: 1.087256, Best Value: 4.021223, Empirical Value: 3.564013
val Loss: 1.077277, Best Value: 4.023449, Empirical Value: 3.568993
Best Value updated
----------
Epoch 138/299
----------
train Loss: 1.087254, Best Value: 4.024109, Empirical Value: 3.562512
val Loss: 1.077047, Best Value: 4.000755, Empirical Value: 3.560248
----------
Epoch 139/299
----------
train Loss: 1.087251, Best Value: 4.023879, Empirical Value: 3.561879
val Loss: 1.078070, Best Value: 3.978302, Empirical Value: 3.520817
----------
Epoch 140/299
----------
Updating Target Model
train Loss: 1.086867, Best Value: 4.031220, Empirical Value: 3.562702


Updating Target Model
train Loss: 1.055533, Best Value: 4.652815, Empirical Value: 4.126342
val Loss: 1.054300, Best Value: 4.639481, Empirical Value: 4.106813
----------
Epoch 181/299
----------
train Loss: 1.051221, Best Value: 4.747924, Empirical Value: 4.251551
val Loss: 1.044412, Best Value: 4.733788, Empirical Value: 4.242607
Best Value updated
----------
Epoch 182/299
----------
train Loss: 1.050829, Best Value: 4.761772, Empirical Value: 4.254810
val Loss: 1.044985, Best Value: 4.780969, Empirical Value: 4.276217
Best Value updated
----------
Epoch 183/299
----------
train Loss: 1.049933, Best Value: 4.776443, Empirical Value: 4.256894
val Loss: 1.045756, Best Value: 4.812892, Empirical Value: 4.294328
Best Value updated
----------
Epoch 184/299
----------
train Loss: 1.049364, Best Value: 4.781144, Empirical Value: 4.255282
val Loss: 1.045176, Best Value: 4.751244, Empirical Value: 4.230918
----------
Epoch 185/299
----------
train Loss: 1.050139, Best Value: 4.779869, Empiric

train Loss: 1.022524, Best Value: 5.404352, Empirical Value: 4.819270
val Loss: 1.022344, Best Value: 5.359642, Empirical Value: 4.788372
----------
Epoch 226/299
----------
train Loss: 1.022746, Best Value: 5.409464, Empirical Value: 4.821537
val Loss: 1.023281, Best Value: 5.412402, Empirical Value: 4.822570
----------
Epoch 227/299
----------
train Loss: 1.022113, Best Value: 5.411415, Empirical Value: 4.821226
val Loss: 1.021629, Best Value: 5.435460, Empirical Value: 4.836306
Best Value updated
----------
Epoch 228/299
----------
train Loss: 1.022262, Best Value: 5.414197, Empirical Value: 4.819109
val Loss: 1.022255, Best Value: 5.360830, Empirical Value: 4.790085
----------
Epoch 229/299
----------
train Loss: 1.021401, Best Value: 5.418856, Empirical Value: 4.821279
val Loss: 1.056432, Best Value: 5.386385, Empirical Value: 4.798192
----------
Epoch 230/299
----------
Updating Target Model
train Loss: 1.022205, Best Value: 5.420693, Empirical Value: 4.820041
val Loss: 1.011556,

Updating Target Model
train Loss: 0.995600, Best Value: 6.004906, Empirical Value: 5.345182
val Loss: 0.998417, Best Value: 6.018784, Empirical Value: 5.368388
Best Value updated
----------
Epoch 271/299
----------
train Loss: 0.988810, Best Value: 6.121039, Empirical Value: 5.503411
val Loss: 0.997697, Best Value: 6.189287, Empirical Value: 5.577872
Best Value updated
----------
Epoch 272/299
----------
train Loss: 0.988041, Best Value: 6.138188, Empirical Value: 5.508816
val Loss: 0.994053, Best Value: 6.104063, Empirical Value: 5.488160
----------
Epoch 273/299
----------
train Loss: 0.989028, Best Value: 6.142584, Empirical Value: 5.508221
val Loss: 0.995489, Best Value: 6.172485, Empirical Value: 5.537745
----------
Epoch 274/299
----------
train Loss: 0.988999, Best Value: 6.147020, Empirical Value: 5.506588
val Loss: 0.995946, Best Value: 6.075401, Empirical Value: 5.457052
----------
Epoch 275/299
----------
train Loss: 0.987711, Best Value: 6.150727, Empirical Value: 5.509739


train Loss: 1.248399, Best Value: 1.619337, Empirical Value: 1.139211
val Loss: 1.222317, Best Value: 1.613669, Empirical Value: 1.129784
----------
Epoch 15/299
----------
train Loss: 1.248183, Best Value: 1.624122, Empirical Value: 1.138370
val Loss: 1.223359, Best Value: 1.630240, Empirical Value: 1.138263
----------
Epoch 16/299
----------
train Loss: 1.247722, Best Value: 1.627571, Empirical Value: 1.136625
val Loss: 1.222811, Best Value: 1.604564, Empirical Value: 1.113384
----------
Epoch 17/299
----------
train Loss: 1.247818, Best Value: 1.629036, Empirical Value: 1.132329
val Loss: 1.224396, Best Value: 1.592999, Empirical Value: 1.098633
----------
Epoch 18/299
----------
train Loss: 1.247898, Best Value: 1.630521, Empirical Value: 1.129359
val Loss: 1.225099, Best Value: 1.620103, Empirical Value: 1.118361
----------
Epoch 19/299
----------
train Loss: 1.247835, Best Value: 1.631786, Empirical Value: 1.126553
val Loss: 1.225237, Best Value: 1.636312, Empirical Value: 1.1286

val Loss: 1.164466, Best Value: 2.649069, Empirical Value: 2.259011
----------
Epoch 60/299
----------
Updating Target Model
train Loss: 1.175346, Best Value: 2.640241, Empirical Value: 2.250546
val Loss: 1.169107, Best Value: 2.654322, Empirical Value: 2.264083
----------
Epoch 61/299
----------
train Loss: 1.163162, Best Value: 2.780647, Empirical Value: 2.431677
val Loss: 1.150467, Best Value: 2.817241, Empirical Value: 2.469404
Best Value updated
----------
Epoch 62/299
----------
train Loss: 1.161648, Best Value: 2.796021, Empirical Value: 2.438085
val Loss: 1.149924, Best Value: 2.831810, Empirical Value: 2.471487
Best Value updated
----------
Epoch 63/299
----------
train Loss: 1.161195, Best Value: 2.805216, Empirical Value: 2.439554
val Loss: 1.150368, Best Value: 2.805231, Empirical Value: 2.427289
----------
Epoch 64/299
----------
train Loss: 1.160642, Best Value: 2.808156, Empirical Value: 2.436895
val Loss: 1.150776, Best Value: 2.829765, Empirical Value: 2.456721
-------

val Loss: 1.117585, Best Value: 3.530133, Empirical Value: 3.106628
----------
Epoch 105/299
----------
train Loss: 1.107360, Best Value: 3.570017, Empirical Value: 3.127441
val Loss: 1.108405, Best Value: 3.607648, Empirical Value: 3.163753
----------
Epoch 106/299
----------
train Loss: 1.107616, Best Value: 3.573145, Empirical Value: 3.128946
val Loss: 1.108868, Best Value: 3.591488, Empirical Value: 3.134664
----------
Epoch 107/299
----------
train Loss: 1.107165, Best Value: 3.580739, Empirical Value: 3.127993
val Loss: 1.108133, Best Value: 3.612685, Empirical Value: 3.150362
Best Value updated
----------
Epoch 108/299
----------
train Loss: 1.106857, Best Value: 3.579577, Empirical Value: 3.125687
val Loss: 1.108978, Best Value: 3.634394, Empirical Value: 3.163884
Best Value updated
----------
Epoch 109/299
----------
train Loss: 1.106386, Best Value: 3.587842, Empirical Value: 3.128406
val Loss: 1.109376, Best Value: 3.595079, Empirical Value: 3.121314
----------
Epoch 110/299

train Loss: 1.077274, Best Value: 4.175780, Empirical Value: 3.612748
val Loss: 1.091720, Best Value: 4.205663, Empirical Value: 3.640544
----------
Epoch 150/299
----------
Updating Target Model
train Loss: 1.076884, Best Value: 4.178046, Empirical Value: 3.614402
val Loss: 1.109898, Best Value: 4.209195, Empirical Value: 3.638084
----------
Epoch 151/299
----------
train Loss: 1.073612, Best Value: 4.362095, Empirical Value: 3.837524
val Loss: 1.099637, Best Value: 4.322345, Empirical Value: 3.803293
Best Value updated
----------
Epoch 152/299
----------
train Loss: 1.072794, Best Value: 4.386485, Empirical Value: 3.842885
val Loss: 1.088898, Best Value: 4.411736, Empirical Value: 3.865443
Best Value updated
----------
Epoch 153/299
----------
train Loss: 1.072080, Best Value: 4.399882, Empirical Value: 3.843415
val Loss: 1.088908, Best Value: 4.414241, Empirical Value: 3.843454
Best Value updated
----------
Epoch 154/299
----------
train Loss: 1.071774, Best Value: 4.414443, Empiric

val Loss: 1.059847, Best Value: 5.544331, Empirical Value: 4.865786
Best Value updated
----------
Epoch 194/299
----------
train Loss: 1.025313, Best Value: 5.525959, Empirical Value: 4.840824
val Loss: 1.055393, Best Value: 5.553012, Empirical Value: 4.864200
Best Value updated
----------
Epoch 195/299
----------
train Loss: 1.025040, Best Value: 5.538156, Empirical Value: 4.841787
val Loss: 1.057689, Best Value: 5.523453, Empirical Value: 4.829420
----------
Epoch 196/299
----------
train Loss: 1.024611, Best Value: 5.540976, Empirical Value: 4.838555
val Loss: 1.058117, Best Value: 5.571304, Empirical Value: 4.888728
Best Value updated
----------
Epoch 197/299
----------
train Loss: 1.024257, Best Value: 5.547454, Empirical Value: 4.839635
val Loss: 1.059801, Best Value: 5.503734, Empirical Value: 4.801743
----------
Epoch 198/299
----------
train Loss: 1.024076, Best Value: 5.555055, Empirical Value: 4.841781
val Loss: 1.059376, Best Value: 5.534644, Empirical Value: 4.807189
-----

val Loss: 1.017906, Best Value: 6.633103, Empirical Value: 5.814605
----------
Epoch 238/299
----------
train Loss: 0.970099, Best Value: 6.656861, Empirical Value: 5.824382
val Loss: 1.020415, Best Value: 6.557600, Empirical Value: 5.754117
----------
Epoch 239/299
----------
train Loss: 0.971012, Best Value: 6.659157, Empirical Value: 5.826968
val Loss: 1.024636, Best Value: 6.619963, Empirical Value: 5.791092
----------
Epoch 240/299
----------
Updating Target Model
train Loss: 0.969359, Best Value: 6.668293, Empirical Value: 5.824972
val Loss: 1.029112, Best Value: 6.608630, Empirical Value: 5.791226
----------
Epoch 241/299
----------
train Loss: 0.960055, Best Value: 6.822918, Empirical Value: 6.025567
val Loss: 1.014133, Best Value: 6.876047, Empirical Value: 6.069515
Best Value updated
----------
Epoch 242/299
----------
train Loss: 0.958682, Best Value: 6.844480, Empirical Value: 6.028943
val Loss: 1.017814, Best Value: 6.776906, Empirical Value: 5.967995
----------
Epoch 243/

train Loss: 0.911668, Best Value: 7.889666, Empirical Value: 6.989877
val Loss: 1.029363, Best Value: 7.874591, Empirical Value: 6.962763
Best Value updated
----------
Epoch 283/299
----------
train Loss: 0.910861, Best Value: 7.902896, Empirical Value: 6.988959
val Loss: 0.977053, Best Value: 7.920405, Empirical Value: 7.006474
Best Value updated
----------
Epoch 284/299
----------
train Loss: 0.910120, Best Value: 7.915825, Empirical Value: 6.990766
val Loss: 0.975903, Best Value: 7.897475, Empirical Value: 6.973501
----------
Epoch 285/299
----------
train Loss: 0.908770, Best Value: 7.926027, Empirical Value: 6.989339
val Loss: 0.982891, Best Value: 7.848043, Empirical Value: 6.901417
----------
Epoch 286/299
----------
train Loss: 0.909471, Best Value: 7.932594, Empirical Value: 6.988043
val Loss: 0.975877, Best Value: 7.920177, Empirical Value: 6.984974
----------
Epoch 287/299
----------
train Loss: 0.907974, Best Value: 7.936789, Empirical Value: 6.988462
val Loss: 0.978073, Be

val Loss: 1.192709, Best Value: 2.489918, Empirical Value: 1.917826
----------
Epoch 26/299
----------
train Loss: 1.206392, Best Value: 2.447429, Empirical Value: 1.881174
val Loss: 1.194973, Best Value: 2.457745, Empirical Value: 1.884593
----------
Epoch 27/299
----------
train Loss: 1.205689, Best Value: 2.452428, Empirical Value: 1.876164
val Loss: 1.194413, Best Value: 2.459042, Empirical Value: 1.892209
----------
Epoch 28/299
----------
train Loss: 1.204703, Best Value: 2.454657, Empirical Value: 1.877331
val Loss: 1.192750, Best Value: 2.567988, Empirical Value: 1.964353
Best Value updated
----------
Epoch 29/299
----------
train Loss: 1.205123, Best Value: 2.458751, Empirical Value: 1.873069
val Loss: 1.193186, Best Value: 2.495240, Empirical Value: 1.906225
----------
Epoch 30/299
----------
Updating Target Model
train Loss: 1.204565, Best Value: 2.461597, Empirical Value: 1.874119
val Loss: 1.282276, Best Value: 2.506102, Empirical Value: 1.909336
----------
Epoch 31/299
--

train Loss: 1.129591, Best Value: 3.672734, Empirical Value: 3.211922
val Loss: 1.137090, Best Value: 3.733182, Empirical Value: 3.262078
Best Value updated
----------
Epoch 72/299
----------
train Loss: 1.124809, Best Value: 3.693780, Empirical Value: 3.218541
val Loss: 1.132392, Best Value: 3.745404, Empirical Value: 3.275433
Best Value updated
----------
Epoch 73/299
----------
train Loss: 1.124223, Best Value: 3.704033, Empirical Value: 3.220495
val Loss: 1.133612, Best Value: 3.734336, Empirical Value: 3.255920
----------
Epoch 74/299
----------
train Loss: 1.123181, Best Value: 3.714204, Empirical Value: 3.220597
val Loss: 1.137937, Best Value: 3.660867, Empirical Value: 3.186245
----------
Epoch 75/299
----------
train Loss: 1.123082, Best Value: 3.712602, Empirical Value: 3.218079
val Loss: 1.134019, Best Value: 3.707382, Empirical Value: 3.211046
----------
Epoch 76/299
----------
train Loss: 1.122478, Best Value: 3.722679, Empirical Value: 3.220805
val Loss: 1.134825, Best Va

train Loss: 1.068648, Best Value: 4.833587, Empirical Value: 4.169621
val Loss: 1.110361, Best Value: 4.866865, Empirical Value: 4.210331
Best Value updated
----------
Epoch 117/299
----------
train Loss: 1.067003, Best Value: 4.835876, Empirical Value: 4.163609
val Loss: 1.107427, Best Value: 4.783257, Empirical Value: 4.121381
----------
Epoch 118/299
----------
train Loss: 1.067031, Best Value: 4.843405, Empirical Value: 4.165816
val Loss: 1.107202, Best Value: 4.836377, Empirical Value: 4.174592
----------
Epoch 119/299
----------
train Loss: 1.067607, Best Value: 4.850645, Empirical Value: 4.166555
val Loss: 1.108435, Best Value: 4.820545, Empirical Value: 4.135074
----------
Epoch 120/299
----------
Updating Target Model
train Loss: 1.066683, Best Value: 4.857569, Empirical Value: 4.164809
val Loss: 1.127690, Best Value: 4.858978, Empirical Value: 4.178974
----------
Epoch 121/299
----------
train Loss: 1.056063, Best Value: 5.068415, Empirical Value: 4.435733
val Loss: 1.093620,

train Loss: 1.002262, Best Value: 6.476744, Empirical Value: 5.688906
val Loss: 1.075051, Best Value: 6.524303, Empirical Value: 5.746876
Best Value updated
----------
Epoch 162/299
----------
train Loss: 0.997336, Best Value: 6.517206, Empirical Value: 5.701969
val Loss: 1.079126, Best Value: 6.449350, Empirical Value: 5.652719
----------
Epoch 163/299
----------
train Loss: 0.995136, Best Value: 6.531011, Empirical Value: 5.704652
val Loss: 1.071881, Best Value: 6.571706, Empirical Value: 5.759126
Best Value updated
----------
Epoch 164/299
----------
train Loss: 0.992265, Best Value: 6.545600, Empirical Value: 5.704016
val Loss: 1.069280, Best Value: 6.577683, Empirical Value: 5.712316
Best Value updated
----------
Epoch 165/299
----------
train Loss: 0.991372, Best Value: 6.558227, Empirical Value: 5.699355
val Loss: 1.070186, Best Value: 6.588462, Empirical Value: 5.742450
Best Value updated
----------
Epoch 166/299
----------
train Loss: 0.990467, Best Value: 6.566580, Empirical 

train Loss: 0.931403, Best Value: 7.789016, Empirical Value: 6.799859
val Loss: 1.044911, Best Value: 7.785688, Empirical Value: 6.802431
----------
Epoch 207/299
----------
train Loss: 0.930045, Best Value: 7.798468, Empirical Value: 6.797942
val Loss: 1.049195, Best Value: 7.802216, Empirical Value: 6.835990
----------
Epoch 208/299
----------
train Loss: 0.929917, Best Value: 7.801210, Empirical Value: 6.798327
val Loss: 1.039797, Best Value: 7.768656, Empirical Value: 6.805975
----------
Epoch 209/299
----------
train Loss: 0.928108, Best Value: 7.806183, Empirical Value: 6.798717
val Loss: 1.039441, Best Value: 7.801754, Empirical Value: 6.819722
----------
Epoch 210/299
----------
Updating Target Model
train Loss: 0.928083, Best Value: 7.810409, Empirical Value: 6.796247
val Loss: 1.049033, Best Value: 7.804849, Empirical Value: 6.817904
----------
Epoch 211/299
----------
train Loss: 0.918966, Best Value: 8.015883, Empirical Value: 7.077085
val Loss: 1.027241, Best Value: 8.0261

val Loss: 1.018846, Best Value: 8.953993, Empirical Value: 7.868254
----------
Epoch 251/299
----------
train Loss: 0.865923, Best Value: 9.125684, Empirical Value: 8.093942
val Loss: 1.001183, Best Value: 9.161352, Empirical Value: 8.144626
Best Value updated
----------
Epoch 252/299
----------
train Loss: 0.862165, Best Value: 9.157232, Empirical Value: 8.108797
val Loss: 1.014365, Best Value: 9.288074, Empirical Value: 8.246595
Best Value updated
----------
Epoch 253/299
----------
train Loss: 0.860874, Best Value: 9.167725, Empirical Value: 8.102457
val Loss: 1.013538, Best Value: 9.080372, Empirical Value: 8.018443
----------
Epoch 254/299
----------
train Loss: 0.859371, Best Value: 9.173295, Empirical Value: 8.102101
val Loss: 1.006938, Best Value: 9.183464, Empirical Value: 8.149810
----------
Epoch 255/299
----------
train Loss: 0.858174, Best Value: 9.176866, Empirical Value: 8.100284
val Loss: 1.004385, Best Value: 9.219244, Empirical Value: 8.185446
----------
Epoch 256/299

train Loss: 0.804367, Best Value: 10.119890, Empirical Value: 9.000505
val Loss: 0.976418, Best Value: 10.103545, Empirical Value: 9.007639
----------
Epoch 296/299
----------
train Loss: 0.803601, Best Value: 10.120901, Empirical Value: 8.998214
val Loss: 0.978131, Best Value: 10.135868, Empirical Value: 9.029474
----------
Epoch 297/299
----------
train Loss: 0.801378, Best Value: 10.124321, Empirical Value: 8.997985
val Loss: 0.973498, Best Value: 10.223447, Empirical Value: 9.128436
----------
Epoch 298/299
----------
train Loss: 0.800468, Best Value: 10.122848, Empirical Value: 8.995199
val Loss: 0.978282, Best Value: 10.110547, Empirical Value: 8.999232
----------
Epoch 299/299
----------
train Loss: 0.799178, Best Value: 10.131127, Empirical Value: 8.997198
val Loss: 0.980692, Best Value: 10.155557, Empirical Value: 9.044424
Training complete in 20m 19s
Best value: 10.260849
{'num_hidden': 10, 'target_update': 10, 'option': 'linear', 'drop_prob': 0.0, 'state_dim': 46, 'use_sched

val Loss: 1.228346, Best Value: 2.575129, Empirical Value: 2.054584
----------
Epoch 39/299
----------
train Loss: 1.209850, Best Value: 2.649048, Empirical Value: 2.092823
val Loss: 1.233030, Best Value: 2.589090, Empirical Value: 2.070731
----------
Epoch 40/299
----------
Updating Target Model
train Loss: 1.210562, Best Value: 2.644030, Empirical Value: 2.087264
val Loss: 1.284376, Best Value: 2.599347, Empirical Value: 2.060532
----------
Epoch 41/299
----------
train Loss: 1.220512, Best Value: 2.889023, Empirical Value: 2.398952
val Loss: 1.235501, Best Value: 2.887058, Empirical Value: 2.409829
Best Value updated
----------
Epoch 42/299
----------
train Loss: 1.211111, Best Value: 2.916735, Empirical Value: 2.415534
val Loss: 1.230826, Best Value: 2.855238, Empirical Value: 2.370862
----------
Epoch 43/299
----------
train Loss: 1.210961, Best Value: 2.934354, Empirical Value: 2.420493
val Loss: 1.237199, Best Value: 2.951781, Empirical Value: 2.451855
Best Value updated
-------

val Loss: 1.286779, Best Value: 4.557121, Empirical Value: 3.825661
----------
Epoch 84/299
----------
train Loss: 1.167777, Best Value: 4.660748, Empirical Value: 3.904267
val Loss: 1.283977, Best Value: 4.622348, Empirical Value: 3.874257
Best Value updated
----------
Epoch 85/299
----------
train Loss: 1.166955, Best Value: 4.669276, Empirical Value: 3.903094
val Loss: 1.285248, Best Value: 4.614362, Empirical Value: 3.851444
----------
Epoch 86/299
----------
train Loss: 1.161828, Best Value: 4.677757, Empirical Value: 3.904008
val Loss: 1.287560, Best Value: 4.700079, Empirical Value: 3.930646
Best Value updated
----------
Epoch 87/299
----------
train Loss: 1.158076, Best Value: 4.695020, Empirical Value: 3.906274
val Loss: 1.293843, Best Value: 4.717795, Empirical Value: 3.934011
Best Value updated
----------
Epoch 88/299
----------
train Loss: 1.158737, Best Value: 4.699676, Empirical Value: 3.904370
val Loss: 1.290278, Best Value: 4.631951, Empirical Value: 3.847707
----------

train Loss: 1.079057, Best Value: 6.198277, Empirical Value: 5.307359
val Loss: 1.309384, Best Value: 6.189361, Empirical Value: 5.298050
----------
Epoch 130/299
----------
Updating Target Model
train Loss: 1.075565, Best Value: 6.200958, Empirical Value: 5.305188
val Loss: 1.310337, Best Value: 6.087276, Empirical Value: 5.196584
----------
Epoch 131/299
----------
train Loss: 1.074178, Best Value: 6.381208, Empirical Value: 5.544738
val Loss: 1.287008, Best Value: 6.392787, Empirical Value: 5.561635
Best Value updated
----------
Epoch 132/299
----------
train Loss: 1.071227, Best Value: 6.407896, Empirical Value: 5.554861
val Loss: 1.278627, Best Value: 6.465799, Empirical Value: 5.616006
Best Value updated
----------
Epoch 133/299
----------
train Loss: 1.066779, Best Value: 6.413506, Empirical Value: 5.551373
val Loss: 1.288991, Best Value: 6.415572, Empirical Value: 5.534964
----------
Epoch 134/299
----------
train Loss: 1.065008, Best Value: 6.422555, Empirical Value: 5.550755


train Loss: 0.966890, Best Value: 7.757128, Empirical Value: 6.800161
val Loss: 1.256643, Best Value: 7.794940, Empirical Value: 6.840311
----------
Epoch 175/299
----------
train Loss: 0.962448, Best Value: 7.774978, Empirical Value: 6.806701
val Loss: 1.257420, Best Value: 7.695323, Empirical Value: 6.739764
----------
Epoch 176/299
----------
train Loss: 0.957859, Best Value: 7.777114, Empirical Value: 6.803108
val Loss: 1.266382, Best Value: 7.683928, Empirical Value: 6.725880
----------
Epoch 177/299
----------
train Loss: 0.957789, Best Value: 7.777245, Empirical Value: 6.801593
val Loss: 1.244914, Best Value: 7.763532, Empirical Value: 6.787133
----------
Epoch 178/299
----------
train Loss: 0.953138, Best Value: 7.785199, Empirical Value: 6.800359
val Loss: 1.266826, Best Value: 7.799701, Empirical Value: 6.822029
----------
Epoch 179/299
----------
train Loss: 0.950853, Best Value: 7.790229, Empirical Value: 6.801694
val Loss: 1.256812, Best Value: 7.872601, Empirical Value: 6

train Loss: 0.855426, Best Value: 9.020694, Empirical Value: 7.979395
val Loss: 1.214512, Best Value: 9.048273, Empirical Value: 8.019633
----------
Epoch 220/299
----------
Updating Target Model
train Loss: 0.854498, Best Value: 9.026765, Empirical Value: 7.979172
val Loss: 1.179517, Best Value: 9.312926, Empirical Value: 8.245017
Best Value updated
----------
Epoch 221/299
----------
train Loss: 0.872580, Best Value: 9.281572, Empirical Value: 8.323833
val Loss: 1.192170, Best Value: 9.407051, Empirical Value: 8.437148
Best Value updated
----------
Epoch 222/299
----------
train Loss: 0.862692, Best Value: 9.318831, Empirical Value: 8.338600
val Loss: 1.200080, Best Value: 9.425059, Empirical Value: 8.462159
Best Value updated
----------
Epoch 223/299
----------
train Loss: 0.859415, Best Value: 9.335607, Empirical Value: 8.341030
val Loss: 1.217444, Best Value: 9.426052, Empirical Value: 8.404205
Best Value updated
----------
Epoch 224/299
----------
train Loss: 0.852488, Best Value

train Loss: 0.776388, Best Value: 10.037586, Empirical Value: 8.963214
val Loss: 1.154865, Best Value: 10.186022, Empirical Value: 9.153336
Best Value updated
----------
Epoch 265/299
----------
train Loss: 0.771264, Best Value: 10.042619, Empirical Value: 8.960415
val Loss: 1.158459, Best Value: 10.188612, Empirical Value: 9.148355
Best Value updated
----------
Epoch 266/299
----------
train Loss: 0.769721, Best Value: 10.053696, Empirical Value: 8.962690
val Loss: 1.158723, Best Value: 10.199453, Empirical Value: 9.150983
Best Value updated
----------
Epoch 267/299
----------
train Loss: 0.769751, Best Value: 10.049141, Empirical Value: 8.958618
val Loss: 1.158130, Best Value: 10.183172, Empirical Value: 9.128284
----------
Epoch 268/299
----------
train Loss: 0.766353, Best Value: 10.053133, Empirical Value: 8.958341
val Loss: 1.157261, Best Value: 10.078199, Empirical Value: 8.996767
----------
Epoch 269/299
----------
train Loss: 0.763615, Best Value: 10.053100, Empirical Value: 8

val Loss: 1.258857, Best Value: 1.244203, Empirical Value: 0.740128
----------
Epoch 8/299
----------
train Loss: 1.288525, Best Value: 1.223871, Empirical Value: 0.728621
val Loss: 1.260621, Best Value: 1.220111, Empirical Value: 0.725218
----------
Epoch 9/299
----------
train Loss: 1.290340, Best Value: 1.209499, Empirical Value: 0.715237
val Loss: 1.262630, Best Value: 1.198847, Empirical Value: 0.702992
----------
Epoch 10/299
----------
Updating Target Model
train Loss: 1.292058, Best Value: 1.198414, Empirical Value: 0.706421
val Loss: 1.312405, Best Value: 1.192937, Empirical Value: 0.697566
----------
Epoch 11/299
----------
train Loss: 1.252504, Best Value: 1.478435, Empirical Value: 1.104885
val Loss: 1.219514, Best Value: 1.499886, Empirical Value: 1.123141
Best Value updated
----------
Epoch 12/299
----------
train Loss: 1.246625, Best Value: 1.505600, Empirical Value: 1.123200
val Loss: 1.218176, Best Value: 1.532671, Empirical Value: 1.141648
Best Value updated
---------

val Loss: 1.148628, Best Value: 2.342287, Empirical Value: 2.045881
Best Value updated
----------
Epoch 53/299
----------
train Loss: 1.173978, Best Value: 2.338730, Empirical Value: 2.039874
val Loss: 1.148816, Best Value: 2.382828, Empirical Value: 2.077714
Best Value updated
----------
Epoch 54/299
----------
train Loss: 1.173989, Best Value: 2.342926, Empirical Value: 2.039118
val Loss: 1.148470, Best Value: 2.344042, Empirical Value: 2.036464
----------
Epoch 55/299
----------
train Loss: 1.173718, Best Value: 2.347915, Empirical Value: 2.038694
val Loss: 1.148737, Best Value: 2.364330, Empirical Value: 2.054865
----------
Epoch 56/299
----------
train Loss: 1.173575, Best Value: 2.348533, Empirical Value: 2.039223
val Loss: 1.152117, Best Value: 2.346629, Empirical Value: 2.048461
----------
Epoch 57/299
----------
train Loss: 1.173534, Best Value: 2.352768, Empirical Value: 2.038515
val Loss: 1.148809, Best Value: 2.382902, Empirical Value: 2.074853
Best Value updated
----------

val Loss: 1.122509, Best Value: 2.861737, Empirical Value: 2.505929
----------
Epoch 98/299
----------
train Loss: 1.144913, Best Value: 2.872820, Empirical Value: 2.516675
val Loss: 1.121522, Best Value: 2.870758, Empirical Value: 2.520933
----------
Epoch 99/299
----------
train Loss: 1.144778, Best Value: 2.872619, Empirical Value: 2.517249
val Loss: 1.122205, Best Value: 2.874296, Empirical Value: 2.516509
----------
Epoch 100/299
----------
Updating Target Model
train Loss: 1.144909, Best Value: 2.875335, Empirical Value: 2.516121
val Loss: 1.128633, Best Value: 2.888632, Empirical Value: 2.527877
Best Value updated
----------
Epoch 101/299
----------
train Loss: 1.141998, Best Value: 2.981677, Empirical Value: 2.654181
val Loss: 1.120440, Best Value: 2.985599, Empirical Value: 2.664021
Best Value updated
----------
Epoch 102/299
----------
train Loss: 1.140960, Best Value: 2.993197, Empirical Value: 2.657353
val Loss: 1.118094, Best Value: 3.027081, Empirical Value: 2.677296
Best

train Loss: 1.124061, Best Value: 3.576273, Empirical Value: 3.184886
val Loss: 1.104153, Best Value: 3.583309, Empirical Value: 3.182637
Best Value updated
----------
Epoch 143/299
----------
train Loss: 1.123429, Best Value: 3.587806, Empirical Value: 3.185826
val Loss: 1.104032, Best Value: 3.608861, Empirical Value: 3.196455
Best Value updated
----------
Epoch 144/299
----------
train Loss: 1.123504, Best Value: 3.594458, Empirical Value: 3.185413
val Loss: 1.104002, Best Value: 3.596083, Empirical Value: 3.185265
----------
Epoch 145/299
----------
train Loss: 1.123874, Best Value: 3.601355, Empirical Value: 3.185128
val Loss: 1.109630, Best Value: 3.560239, Empirical Value: 3.153644
----------
Epoch 146/299
----------
train Loss: 1.123107, Best Value: 3.605686, Empirical Value: 3.186551
val Loss: 1.104348, Best Value: 3.641039, Empirical Value: 3.207704
Best Value updated
----------
Epoch 147/299
----------
train Loss: 1.123360, Best Value: 3.608570, Empirical Value: 3.184083
val

val Loss: 1.095685, Best Value: 4.290151, Empirical Value: 3.791151
Best Value updated
----------
Epoch 187/299
----------
train Loss: 1.110296, Best Value: 4.230341, Empirical Value: 3.739864
val Loss: 1.095322, Best Value: 4.243752, Empirical Value: 3.749643
----------
Epoch 188/299
----------
train Loss: 1.110235, Best Value: 4.230601, Empirical Value: 3.739440
val Loss: 1.094405, Best Value: 4.213931, Empirical Value: 3.730424
----------
Epoch 189/299
----------
train Loss: 1.110056, Best Value: 4.234281, Empirical Value: 3.740615
val Loss: 1.094629, Best Value: 4.264775, Empirical Value: 3.766155
----------
Epoch 190/299
----------
Updating Target Model
train Loss: 1.109987, Best Value: 4.238396, Empirical Value: 3.740539
val Loss: 1.110528, Best Value: 4.247781, Empirical Value: 3.721514
----------
Epoch 191/299
----------
train Loss: 1.112779, Best Value: 4.332917, Empirical Value: 3.874042
val Loss: 1.113861, Best Value: 4.259012, Empirical Value: 3.829246
----------
Epoch 192/

train Loss: 1.100246, Best Value: 4.938554, Empirical Value: 4.437446
val Loss: 1.089744, Best Value: 4.975502, Empirical Value: 4.471560
Best Value updated
----------
Epoch 232/299
----------
train Loss: 1.099123, Best Value: 4.951391, Empirical Value: 4.439278
val Loss: 1.087710, Best Value: 4.992630, Empirical Value: 4.479714
Best Value updated
----------
Epoch 233/299
----------
train Loss: 1.099774, Best Value: 4.963303, Empirical Value: 4.440997
val Loss: 1.088335, Best Value: 4.988384, Empirical Value: 4.470551
----------
Epoch 234/299
----------
train Loss: 1.099191, Best Value: 4.967656, Empirical Value: 4.441639
val Loss: 1.089138, Best Value: 4.991093, Empirical Value: 4.467018
----------
Epoch 235/299
----------
train Loss: 1.098466, Best Value: 4.973437, Empirical Value: 4.442256
val Loss: 1.089845, Best Value: 4.995702, Empirical Value: 4.465144
Best Value updated
----------
Epoch 236/299
----------
train Loss: 1.099033, Best Value: 4.977903, Empirical Value: 4.443652
val

train Loss: 1.071969, Best Value: 5.441684, Empirical Value: 4.873852
val Loss: 1.066865, Best Value: 5.441686, Empirical Value: 4.877173
----------
Epoch 277/299
----------
train Loss: 1.071219, Best Value: 5.445549, Empirical Value: 4.877587
val Loss: 1.064918, Best Value: 5.491922, Empirical Value: 4.906366
----------
Epoch 278/299
----------
train Loss: 1.071982, Best Value: 5.448101, Empirical Value: 4.875405
val Loss: 1.067307, Best Value: 5.434115, Empirical Value: 4.866062
----------
Epoch 279/299
----------
train Loss: 1.071652, Best Value: 5.449229, Empirical Value: 4.876023
val Loss: 1.067604, Best Value: 5.482645, Empirical Value: 4.920842
----------
Epoch 280/299
----------
Updating Target Model
train Loss: 1.071717, Best Value: 5.455067, Empirical Value: 4.878778
val Loss: 1.062137, Best Value: 5.536673, Empirical Value: 4.955030
Best Value updated
----------
Epoch 281/299
----------
train Loss: 1.064968, Best Value: 5.555112, Empirical Value: 5.017839
val Loss: 1.058935,

Updating Target Model
train Loss: 1.246580, Best Value: 1.724572, Empirical Value: 1.174891
val Loss: 1.311427, Best Value: 1.682573, Empirical Value: 1.139554
----------
Epoch 21/299
----------
train Loss: 1.233745, Best Value: 2.019672, Empirical Value: 1.573792
val Loss: 1.209596, Best Value: 2.049468, Empirical Value: 1.578246
Best Value updated
----------
Epoch 22/299
----------
train Loss: 1.228151, Best Value: 2.062825, Empirical Value: 1.590385
val Loss: 1.208285, Best Value: 2.053448, Empirical Value: 1.578146
Best Value updated
----------
Epoch 23/299
----------
train Loss: 1.226665, Best Value: 2.077010, Empirical Value: 1.591970
val Loss: 1.208329, Best Value: 2.073813, Empirical Value: 1.604152
Best Value updated
----------
Epoch 24/299
----------
train Loss: 1.226059, Best Value: 2.085368, Empirical Value: 1.589813
val Loss: 1.207243, Best Value: 2.049333, Empirical Value: 1.557066
----------
Epoch 25/299
----------
train Loss: 1.225126, Best Value: 2.101091, Empirical Va

train Loss: 1.153341, Best Value: 3.367924, Empirical Value: 2.836679
val Loss: 1.144917, Best Value: 3.388541, Empirical Value: 2.856497
Best Value updated
----------
Epoch 66/299
----------
train Loss: 1.153808, Best Value: 3.380954, Empirical Value: 2.835798
val Loss: 1.144749, Best Value: 3.369488, Empirical Value: 2.833928
----------
Epoch 67/299
----------
train Loss: 1.153750, Best Value: 3.384394, Empirical Value: 2.836011
val Loss: 1.144345, Best Value: 3.368312, Empirical Value: 2.838170
----------
Epoch 68/299
----------
train Loss: 1.152620, Best Value: 3.393322, Empirical Value: 2.837026
val Loss: 1.146255, Best Value: 3.338709, Empirical Value: 2.778552
----------
Epoch 69/299
----------
train Loss: 1.152909, Best Value: 3.393021, Empirical Value: 2.834943
val Loss: 1.144922, Best Value: 3.389998, Empirical Value: 2.832865
Best Value updated
----------
Epoch 70/299
----------
Updating Target Model
train Loss: 1.152873, Best Value: 3.406545, Empirical Value: 2.834553
val L

Updating Target Model
train Loss: 1.110330, Best Value: 4.574517, Empirical Value: 3.909219
val Loss: 1.129703, Best Value: 4.569246, Empirical Value: 3.900733
----------
Epoch 111/299
----------
train Loss: 1.092654, Best Value: 4.751569, Empirical Value: 4.167513
val Loss: 1.096652, Best Value: 4.813714, Empirical Value: 4.213367
Best Value updated
----------
Epoch 112/299
----------
train Loss: 1.091922, Best Value: 4.775177, Empirical Value: 4.173016
val Loss: 1.093127, Best Value: 4.773143, Empirical Value: 4.146008
----------
Epoch 113/299
----------
train Loss: 1.089716, Best Value: 4.781824, Empirical Value: 4.172001
val Loss: 1.094374, Best Value: 4.740718, Empirical Value: 4.142275
----------
Epoch 114/299
----------
train Loss: 1.090095, Best Value: 4.796619, Empirical Value: 4.175189
val Loss: 1.095772, Best Value: 4.809856, Empirical Value: 4.174428
----------
Epoch 115/299
----------
train Loss: 1.089945, Best Value: 4.802486, Empirical Value: 4.172247
val Loss: 1.101005,

train Loss: 1.026627, Best Value: 5.612672, Empirical Value: 4.961725
val Loss: 1.042101, Best Value: 5.610622, Empirical Value: 4.956997
----------
Epoch 156/299
----------
train Loss: 1.025766, Best Value: 5.622166, Empirical Value: 4.961253
val Loss: 1.042911, Best Value: 5.594179, Empirical Value: 4.936998
----------
Epoch 157/299
----------
train Loss: 1.025671, Best Value: 5.628496, Empirical Value: 4.962043
val Loss: 1.040620, Best Value: 5.615226, Empirical Value: 4.942500
----------
Epoch 158/299
----------
train Loss: 1.025572, Best Value: 5.630748, Empirical Value: 4.961740
val Loss: 1.055533, Best Value: 5.575345, Empirical Value: 4.893235
----------
Epoch 159/299
----------
train Loss: 1.025162, Best Value: 5.638289, Empirical Value: 4.961588
val Loss: 1.043192, Best Value: 5.681849, Empirical Value: 4.984372
Best Value updated
----------
Epoch 160/299
----------
Updating Target Model
train Loss: 1.024623, Best Value: 5.640378, Empirical Value: 4.959975
val Loss: 1.040702,

Updating Target Model
train Loss: 0.978877, Best Value: 6.420091, Empirical Value: 5.640660
val Loss: 1.014046, Best Value: 6.432698, Empirical Value: 5.649123
----------
Epoch 201/299
----------
train Loss: 0.975021, Best Value: 6.578365, Empirical Value: 5.848665
val Loss: 0.996751, Best Value: 6.587491, Empirical Value: 5.837863
Best Value updated
----------
Epoch 202/299
----------
train Loss: 0.972607, Best Value: 6.605667, Empirical Value: 5.856361
val Loss: 0.997357, Best Value: 6.651386, Empirical Value: 5.870063
Best Value updated
----------
Epoch 203/299
----------
train Loss: 0.972047, Best Value: 6.617078, Empirical Value: 5.850866
val Loss: 0.998844, Best Value: 6.627470, Empirical Value: 5.850661
----------
Epoch 204/299
----------
train Loss: 0.972135, Best Value: 6.629404, Empirical Value: 5.852036
val Loss: 1.001434, Best Value: 6.642052, Empirical Value: 5.859046
----------
Epoch 205/299
----------
train Loss: 0.971120, Best Value: 6.640732, Empirical Value: 5.854894


val Loss: 0.973196, Best Value: 7.552495, Empirical Value: 6.633710
Best Value updated
----------
Epoch 245/299
----------
train Loss: 0.934415, Best Value: 7.553286, Empirical Value: 6.648820
val Loss: 0.975943, Best Value: 7.541570, Empirical Value: 6.626150
----------
Epoch 246/299
----------
train Loss: 0.933240, Best Value: 7.567566, Empirical Value: 6.651429
val Loss: 0.971746, Best Value: 7.505838, Empirical Value: 6.615716
----------
Epoch 247/299
----------
train Loss: 0.932776, Best Value: 7.571075, Empirical Value: 6.649937
val Loss: 0.979205, Best Value: 7.643684, Empirical Value: 6.729328
Best Value updated
----------
Epoch 248/299
----------
train Loss: 0.933767, Best Value: 7.569334, Empirical Value: 6.649120
val Loss: 0.972984, Best Value: 7.537566, Empirical Value: 6.601104
----------
Epoch 249/299
----------
train Loss: 0.933295, Best Value: 7.577464, Empirical Value: 6.650881
val Loss: 0.972851, Best Value: 7.592153, Empirical Value: 6.657607
----------
Epoch 250/299

Updating Target Model
train Loss: 0.902039, Best Value: 8.625497, Empirical Value: 7.558772
val Loss: 0.964358, Best Value: 8.663148, Empirical Value: 7.607613
Best Value updated
----------
Epoch 291/299
----------
train Loss: 0.892538, Best Value: 8.868009, Empirical Value: 7.876201
val Loss: 0.942903, Best Value: 8.845945, Empirical Value: 7.826269
Best Value updated
----------
Epoch 292/299
----------
train Loss: 0.892560, Best Value: 8.900927, Empirical Value: 7.880418
val Loss: 0.945045, Best Value: 8.879928, Empirical Value: 7.851269
Best Value updated
----------
Epoch 293/299
----------
train Loss: 0.891170, Best Value: 8.918864, Empirical Value: 7.879778
val Loss: 0.948264, Best Value: 8.967215, Empirical Value: 7.929582
Best Value updated
----------
Epoch 294/299
----------
train Loss: 0.889843, Best Value: 8.936867, Empirical Value: 7.880048
val Loss: 0.946000, Best Value: 8.927883, Empirical Value: 7.854494
----------
Epoch 295/299
----------
train Loss: 0.888569, Best Value

val Loss: 1.181977, Best Value: 3.165635, Empirical Value: 2.522444
Best Value updated
----------
Epoch 33/299
----------
train Loss: 1.196160, Best Value: 3.135983, Empirical Value: 2.486386
val Loss: 1.180855, Best Value: 3.156033, Empirical Value: 2.508202
----------
Epoch 34/299
----------
train Loss: 1.194495, Best Value: 3.152861, Empirical Value: 2.487117
val Loss: 1.180180, Best Value: 3.140582, Empirical Value: 2.477882
----------
Epoch 35/299
----------
train Loss: 1.194061, Best Value: 3.154799, Empirical Value: 2.485498
val Loss: 1.181692, Best Value: 3.145549, Empirical Value: 2.480300
----------
Epoch 36/299
----------
train Loss: 1.192754, Best Value: 3.168135, Empirical Value: 2.484667
val Loss: 1.181677, Best Value: 3.132870, Empirical Value: 2.447485
----------
Epoch 37/299
----------
train Loss: 1.192250, Best Value: 3.176632, Empirical Value: 2.485165
val Loss: 1.183838, Best Value: 3.160971, Empirical Value: 2.475047
----------
Epoch 38/299
----------
train Loss: 1

train Loss: 1.106974, Best Value: 4.519673, Empirical Value: 3.834582
val Loss: 1.125712, Best Value: 4.523975, Empirical Value: 3.828972
----------
Epoch 79/299
----------
train Loss: 1.106280, Best Value: 4.526568, Empirical Value: 3.833344
val Loss: 1.124263, Best Value: 4.561221, Empirical Value: 3.879202
----------
Epoch 80/299
----------
Updating Target Model
train Loss: 1.106346, Best Value: 4.531352, Empirical Value: 3.834299
val Loss: 1.155006, Best Value: 4.574218, Empirical Value: 3.889369
----------
Epoch 81/299
----------
train Loss: 1.100344, Best Value: 4.761536, Empirical Value: 4.154037
val Loss: 1.121824, Best Value: 4.793545, Empirical Value: 4.152901
Best Value updated
----------
Epoch 82/299
----------
train Loss: 1.096417, Best Value: 4.791955, Empirical Value: 4.162659
val Loss: 1.113278, Best Value: 4.821227, Empirical Value: 4.158830
Best Value updated
----------
Epoch 83/299
----------
train Loss: 1.094710, Best Value: 4.803126, Empirical Value: 4.157645
val L

val Loss: 1.063711, Best Value: 6.181842, Empirical Value: 5.375739
Best Value updated
----------
Epoch 123/299
----------
train Loss: 1.014571, Best Value: 6.186525, Empirical Value: 5.350447
val Loss: 1.063371, Best Value: 6.213419, Empirical Value: 5.376689
Best Value updated
----------
Epoch 124/299
----------
train Loss: 1.011855, Best Value: 6.206585, Empirical Value: 5.350739
val Loss: 1.058624, Best Value: 6.206213, Empirical Value: 5.371379
----------
Epoch 125/299
----------
train Loss: 1.011198, Best Value: 6.218994, Empirical Value: 5.351534
val Loss: 1.062043, Best Value: 6.227434, Empirical Value: 5.348236
Best Value updated
----------
Epoch 126/299
----------
train Loss: 1.010607, Best Value: 6.223766, Empirical Value: 5.347225
val Loss: 1.062711, Best Value: 6.223163, Empirical Value: 5.349897
----------
Epoch 127/299
----------
train Loss: 1.010616, Best Value: 6.232429, Empirical Value: 5.347544
val Loss: 1.062939, Best Value: 6.241528, Empirical Value: 5.363450
Best 

train Loss: 0.939859, Best Value: 7.825713, Empirical Value: 6.705219
val Loss: 1.032896, Best Value: 7.870433, Empirical Value: 6.749717
Best Value updated
----------
Epoch 168/299
----------
train Loss: 0.940220, Best Value: 7.828092, Empirical Value: 6.700765
val Loss: 1.030195, Best Value: 7.855418, Empirical Value: 6.741680
----------
Epoch 169/299
----------
train Loss: 0.939060, Best Value: 7.836202, Empirical Value: 6.701062
val Loss: 1.050589, Best Value: 7.721461, Empirical Value: 6.621174
----------
Epoch 170/299
----------
Updating Target Model
train Loss: 0.939298, Best Value: 7.848406, Empirical Value: 6.701398
val Loss: 1.101103, Best Value: 7.893225, Empirical Value: 6.749508
Best Value updated
----------
Epoch 171/299
----------
train Loss: 0.945351, Best Value: 8.160744, Empirical Value: 7.122164
val Loss: 1.037644, Best Value: 8.158312, Empirical Value: 7.090734
Best Value updated
----------
Epoch 172/299
----------
train Loss: 0.940749, Best Value: 8.217286, Empiric

val Loss: 1.050139, Best Value: 9.512679, Empirical Value: 8.220378
----------
Epoch 211/299
----------
train Loss: 0.871137, Best Value: 9.816556, Empirical Value: 8.586953
val Loss: 1.004593, Best Value: 9.898940, Empirical Value: 8.672267
Best Value updated
----------
Epoch 212/299
----------
train Loss: 0.869884, Best Value: 9.857891, Empirical Value: 8.586851
val Loss: 0.995334, Best Value: 9.887851, Empirical Value: 8.597023
----------
Epoch 213/299
----------
train Loss: 0.865782, Best Value: 9.877448, Empirical Value: 8.587072
val Loss: 0.997263, Best Value: 9.903170, Empirical Value: 8.595743
Best Value updated
----------
Epoch 214/299
----------
train Loss: 0.864073, Best Value: 9.898315, Empirical Value: 8.582687
val Loss: 0.995630, Best Value: 9.868100, Empirical Value: 8.570869
----------
Epoch 215/299
----------
train Loss: 0.862676, Best Value: 9.905397, Empirical Value: 8.583835
val Loss: 1.004159, Best Value: 9.911127, Empirical Value: 8.595112
Best Value updated
-----

train Loss: 0.782137, Best Value: 11.536487, Empirical Value: 10.106333
val Loss: 0.968012, Best Value: 11.447269, Empirical Value: 10.055388
----------
Epoch 256/299
----------
train Loss: 0.782035, Best Value: 11.531407, Empirical Value: 10.106039
val Loss: 0.953974, Best Value: 11.582780, Empirical Value: 10.170960
Best Value updated
----------
Epoch 257/299
----------
train Loss: 0.780116, Best Value: 11.532384, Empirical Value: 10.102337
val Loss: 0.952955, Best Value: 11.534619, Empirical Value: 10.073485
----------
Epoch 258/299
----------
train Loss: 0.780524, Best Value: 11.550458, Empirical Value: 10.099247
val Loss: 0.953820, Best Value: 11.403740, Empirical Value: 10.018330
----------
Epoch 259/299
----------
train Loss: 0.776669, Best Value: 11.553969, Empirical Value: 10.102490
val Loss: 0.957400, Best Value: 11.563545, Empirical Value: 10.075466
----------
Epoch 260/299
----------
Updating Target Model
train Loss: 0.778122, Best Value: 11.570657, Empirical Value: 10.1021

val Loss: 0.902933, Best Value: 12.771195, Empirical Value: 11.283173
----------
Epoch 299/299
----------
train Loss: 0.707732, Best Value: 12.786779, Empirical Value: 11.287657
val Loss: 0.907402, Best Value: 12.809053, Empirical Value: 11.294085
Training complete in 18m 51s
Best value: 12.831766
{'num_hidden': 5, 'target_update': 10, 'option': 'linear', 'drop_prob': 0.0, 'state_dim': 46, 'use_scheduler': False, 'batch_size': 512, 'lr': 0.0001, 'hidden_dim': 512, 'num_epochs': 300, 'gamma': 0.9, 'action_dim': 25}
----------
Epoch 0/299
----------
Updating Target Model
train Loss: 1.315171, Best Value: 1.051880, Empirical Value: 0.051844
val Loss: 1.598129, Best Value: 0.946619, Empirical Value: 0.051251
Best Value updated
----------
Epoch 1/299
----------
train Loss: 1.300464, Best Value: 1.428575, Empirical Value: 0.781569
val Loss: 1.251502, Best Value: 1.496007, Empirical Value: 0.840903
Best Value updated
----------
Epoch 2/299
----------
train Loss: 1.275346, Best Value: 1.508184

train Loss: 1.179902, Best Value: 3.324593, Empirical Value: 2.727826
val Loss: 1.187668, Best Value: 3.344235, Empirical Value: 2.740368
Best Value updated
----------
Epoch 42/299
----------
train Loss: 1.174412, Best Value: 3.352974, Empirical Value: 2.736727
val Loss: 1.187692, Best Value: 3.345544, Empirical Value: 2.735099
Best Value updated
----------
Epoch 43/299
----------
train Loss: 1.172176, Best Value: 3.356949, Empirical Value: 2.732675
val Loss: 1.186972, Best Value: 3.421190, Empirical Value: 2.783372
Best Value updated
----------
Epoch 44/299
----------
train Loss: 1.168808, Best Value: 3.382926, Empirical Value: 2.736666
val Loss: 1.185901, Best Value: 3.422842, Empirical Value: 2.767504
Best Value updated
----------
Epoch 45/299
----------
train Loss: 1.167392, Best Value: 3.396261, Empirical Value: 2.733400
val Loss: 1.188394, Best Value: 3.389285, Empirical Value: 2.736191
----------
Epoch 46/299
----------
train Loss: 1.166500, Best Value: 3.410738, Empirical Value

train Loss: 1.087198, Best Value: 5.660861, Empirical Value: 4.575927
val Loss: 1.183387, Best Value: 5.615775, Empirical Value: 4.535182
----------
Epoch 86/299
----------
train Loss: 1.083407, Best Value: 5.685606, Empirical Value: 4.574264
val Loss: 1.197332, Best Value: 5.629379, Empirical Value: 4.581540
----------
Epoch 87/299
----------
train Loss: 1.081506, Best Value: 5.711086, Empirical Value: 4.576189
val Loss: 1.176568, Best Value: 5.830407, Empirical Value: 4.673561
Best Value updated
----------
Epoch 88/299
----------
train Loss: 1.079909, Best Value: 5.724871, Empirical Value: 4.574715
val Loss: 1.173486, Best Value: 5.852900, Empirical Value: 4.713373
Best Value updated
----------
Epoch 89/299
----------
train Loss: 1.076747, Best Value: 5.729980, Empirical Value: 4.572057
val Loss: 1.179626, Best Value: 5.667790, Empirical Value: 4.522661
----------
Epoch 90/299
----------
Updating Target Model
train Loss: 1.075979, Best Value: 5.750652, Empirical Value: 4.570088
val L

train Loss: 0.982930, Best Value: 8.582173, Empirical Value: 7.143793
val Loss: 1.176075, Best Value: 8.568916, Empirical Value: 7.177384
----------
Epoch 130/299
----------
Updating Target Model
train Loss: 0.979406, Best Value: 8.608320, Empirical Value: 7.148218
val Loss: 1.297848, Best Value: 8.670060, Empirical Value: 7.206830
----------
Epoch 131/299
----------
train Loss: 0.991750, Best Value: 9.107909, Empirical Value: 7.792396
val Loss: 1.161859, Best Value: 9.141701, Empirical Value: 7.830358
Best Value updated
----------
Epoch 132/299
----------
train Loss: 0.972823, Best Value: 9.173689, Empirical Value: 7.819076
val Loss: 1.165869, Best Value: 9.128592, Empirical Value: 7.752712
----------
Epoch 133/299
----------
train Loss: 0.964947, Best Value: 9.205808, Empirical Value: 7.812748
val Loss: 1.161240, Best Value: 9.209784, Empirical Value: 7.851006
Best Value updated
----------
Epoch 134/299
----------
train Loss: 0.961440, Best Value: 9.222983, Empirical Value: 7.813925


val Loss: 1.097478, Best Value: 11.249409, Empirical Value: 9.836485
Best Value updated
----------
Epoch 174/299
----------
train Loss: 0.827892, Best Value: 11.100593, Empirical Value: 9.695067
val Loss: 1.097188, Best Value: 11.131840, Empirical Value: 9.751447
----------
Epoch 175/299
----------
train Loss: 0.822003, Best Value: 11.110902, Empirical Value: 9.692787
val Loss: 1.091099, Best Value: 11.074483, Empirical Value: 9.674457
----------
Epoch 176/299
----------
train Loss: 0.819947, Best Value: 11.123727, Empirical Value: 9.696429
val Loss: 1.108897, Best Value: 11.138521, Empirical Value: 9.714703
----------
Epoch 177/299
----------
train Loss: 0.820004, Best Value: 11.123562, Empirical Value: 9.692587
val Loss: 1.099537, Best Value: 11.109141, Empirical Value: 9.686018
----------
Epoch 178/299
----------
train Loss: 0.816481, Best Value: 11.117416, Empirical Value: 9.688801
val Loss: 1.103032, Best Value: 11.113200, Empirical Value: 9.714458
----------
Epoch 179/299
-------

train Loss: 0.717925, Best Value: 12.046750, Empirical Value: 10.610388
val Loss: 1.045476, Best Value: 12.228607, Empirical Value: 10.782457
Best Value updated
----------
Epoch 219/299
----------
train Loss: 0.714430, Best Value: 12.048681, Empirical Value: 10.602630
val Loss: 1.097235, Best Value: 12.129134, Empirical Value: 10.711050
----------
Epoch 220/299
----------
Updating Target Model
train Loss: 0.712421, Best Value: 12.053782, Empirical Value: 10.606063
val Loss: 1.016312, Best Value: 12.112851, Empirical Value: 10.651102
----------
Epoch 221/299
----------
train Loss: 0.712539, Best Value: 12.241728, Empirical Value: 10.848883
val Loss: 1.023495, Best Value: 12.284690, Empirical Value: 10.867313
Best Value updated
----------
Epoch 222/299
----------
train Loss: 0.707494, Best Value: 12.258512, Empirical Value: 10.842872
val Loss: 1.017636, Best Value: 12.303087, Empirical Value: 10.885009
Best Value updated
----------
Epoch 223/299
----------
train Loss: 0.700319, Best Valu

train Loss: 0.642169, Best Value: 12.987747, Empirical Value: 11.519635
val Loss: 0.985401, Best Value: 13.015937, Empirical Value: 11.531590
----------
Epoch 263/299
----------
train Loss: 0.634416, Best Value: 13.000285, Empirical Value: 11.514285
val Loss: 0.978801, Best Value: 12.983886, Empirical Value: 11.508375
----------
Epoch 264/299
----------
train Loss: 0.634269, Best Value: 13.002390, Empirical Value: 11.510666
val Loss: 0.987984, Best Value: 13.137104, Empirical Value: 11.679398
Best Value updated
----------
Epoch 265/299
----------
train Loss: 0.630356, Best Value: 13.002613, Empirical Value: 11.509850
val Loss: 0.989007, Best Value: 13.175277, Empirical Value: 11.740590
Best Value updated
----------
Epoch 266/299
----------
train Loss: 0.626068, Best Value: 13.001404, Empirical Value: 11.502758
val Loss: 0.984311, Best Value: 13.063687, Empirical Value: 11.567118
----------
Epoch 267/299
----------
train Loss: 0.625168, Best Value: 13.018297, Empirical Value: 11.503213


train Loss: 1.278070, Best Value: 1.503038, Empirical Value: 0.732900
val Loss: 1.257385, Best Value: 1.463570, Empirical Value: 0.710576
----------
Epoch 6/299
----------
train Loss: 1.276485, Best Value: 1.516197, Empirical Value: 0.726764
val Loss: 1.257249, Best Value: 1.508798, Empirical Value: 0.718549
----------
Epoch 7/299
----------
train Loss: 1.275532, Best Value: 1.542083, Empirical Value: 0.719095
val Loss: 1.257815, Best Value: 1.524898, Empirical Value: 0.712427
Best Value updated
----------
Epoch 8/299
----------
train Loss: 1.274477, Best Value: 1.559902, Empirical Value: 0.717639
val Loss: 1.256450, Best Value: 1.542932, Empirical Value: 0.699912
Best Value updated
----------
Epoch 9/299
----------
train Loss: 1.273211, Best Value: 1.578503, Empirical Value: 0.716255
val Loss: 1.259121, Best Value: 1.617509, Empirical Value: 0.744323
Best Value updated
----------
Epoch 10/299
----------
Updating Target Model
train Loss: 1.273503, Best Value: 1.586363, Empirical Value:

Updating Target Model
train Loss: 1.195558, Best Value: 3.888726, Empirical Value: 2.942979
val Loss: 1.401463, Best Value: 3.733051, Empirical Value: 2.842385
----------
Epoch 51/299
----------
train Loss: 1.193664, Best Value: 4.278650, Empirical Value: 3.414769
val Loss: 1.280298, Best Value: 4.248167, Empirical Value: 3.395837
Best Value updated
----------
Epoch 52/299
----------
train Loss: 1.179234, Best Value: 4.327590, Empirical Value: 3.428513
val Loss: 1.271398, Best Value: 4.289073, Empirical Value: 3.360164
Best Value updated
----------
Epoch 53/299
----------
train Loss: 1.172000, Best Value: 4.375138, Empirical Value: 3.422070
val Loss: 1.279319, Best Value: 4.249934, Empirical Value: 3.332831
----------
Epoch 54/299
----------
train Loss: 1.167470, Best Value: 4.398486, Empirical Value: 3.425889
val Loss: 1.285515, Best Value: 4.286586, Empirical Value: 3.355556
----------
Epoch 55/299
----------
train Loss: 1.163041, Best Value: 4.406690, Empirical Value: 3.417691
val L

val Loss: 1.397444, Best Value: 7.799582, Empirical Value: 6.353409
----------
Epoch 95/299
----------
train Loss: 1.087846, Best Value: 7.800140, Empirical Value: 6.322709
val Loss: 1.381414, Best Value: 7.776086, Empirical Value: 6.304301
----------
Epoch 96/299
----------
train Loss: 1.079578, Best Value: 7.808061, Empirical Value: 6.322238
val Loss: 1.395383, Best Value: 7.971064, Empirical Value: 6.478127
Best Value updated
----------
Epoch 97/299
----------
train Loss: 1.069648, Best Value: 7.832924, Empirical Value: 6.318703
val Loss: 1.401716, Best Value: 7.761959, Empirical Value: 6.264667
----------
Epoch 98/299
----------
train Loss: 1.067988, Best Value: 7.848121, Empirical Value: 6.316813
val Loss: 1.403527, Best Value: 7.841450, Empirical Value: 6.336549
----------
Epoch 99/299
----------
train Loss: 1.061765, Best Value: 7.866727, Empirical Value: 6.318145
val Loss: 1.400591, Best Value: 7.888104, Empirical Value: 6.325505
----------
Epoch 100/299
----------
Updating Tar

val Loss: 1.327300, Best Value: 10.434721, Empirical Value: 9.004548
----------
Epoch 140/299
----------
Updating Target Model
train Loss: 0.854025, Best Value: 10.364132, Empirical Value: 8.900067
val Loss: 1.269975, Best Value: 10.419467, Empirical Value: 8.959739
----------
Epoch 141/299
----------
train Loss: 0.865727, Best Value: 10.697828, Empirical Value: 9.338163
val Loss: 1.250042, Best Value: 10.807916, Empirical Value: 9.482187
Best Value updated
----------
Epoch 142/299
----------
train Loss: 0.849516, Best Value: 10.705230, Empirical Value: 9.335070
val Loss: 1.257007, Best Value: 10.673275, Empirical Value: 9.330679
----------
Epoch 143/299
----------
train Loss: 0.837983, Best Value: 10.712049, Empirical Value: 9.332898
val Loss: 1.275432, Best Value: 10.830949, Empirical Value: 9.456102
Best Value updated
----------
Epoch 144/299
----------
train Loss: 0.831654, Best Value: 10.699849, Empirical Value: 9.324904
val Loss: 1.252934, Best Value: 10.755127, Empirical Value: 

train Loss: 0.664036, Best Value: 11.889806, Empirical Value: 10.531031
val Loss: 1.129875, Best Value: 12.000131, Empirical Value: 10.647915
----------
Epoch 185/299
----------
train Loss: 0.661987, Best Value: 11.889286, Empirical Value: 10.526455
val Loss: 1.149648, Best Value: 11.991721, Empirical Value: 10.657262
----------
Epoch 186/299
----------
train Loss: 0.652891, Best Value: 11.888169, Empirical Value: 10.526131
val Loss: 1.147168, Best Value: 11.991474, Empirical Value: 10.643039
----------
Epoch 187/299
----------
train Loss: 0.648757, Best Value: 11.889896, Empirical Value: 10.523588
val Loss: 1.144935, Best Value: 12.012849, Empirical Value: 10.631708
----------
Epoch 188/299
----------
train Loss: 0.645756, Best Value: 11.895935, Empirical Value: 10.516250
val Loss: 1.154355, Best Value: 12.047832, Empirical Value: 10.709720
Best Value updated
----------
Epoch 189/299
----------
train Loss: 0.641245, Best Value: 11.896679, Empirical Value: 10.520771
val Loss: 1.149513,

val Loss: 1.106614, Best Value: 12.736739, Empirical Value: 11.341502
----------
Epoch 229/299
----------
train Loss: 0.541394, Best Value: 12.609727, Empirical Value: 11.204470
val Loss: 1.076079, Best Value: 12.705293, Empirical Value: 11.282491
----------
Epoch 230/299
----------
Updating Target Model
train Loss: 0.543506, Best Value: 12.624659, Empirical Value: 11.200253
val Loss: 1.013577, Best Value: 12.663684, Empirical Value: 11.281630
----------
Epoch 231/299
----------
train Loss: 0.573239, Best Value: 12.689836, Empirical Value: 11.301007
val Loss: 1.053539, Best Value: 12.828817, Empirical Value: 11.490485
Best Value updated
----------
Epoch 232/299
----------
train Loss: 0.563931, Best Value: 12.681362, Empirical Value: 11.282657
val Loss: 1.084583, Best Value: 12.705410, Empirical Value: 11.305384
----------
Epoch 233/299
----------
train Loss: 0.555998, Best Value: 12.686540, Empirical Value: 11.278916
val Loss: 1.070355, Best Value: 12.807773, Empirical Value: 11.423548

train Loss: 0.489827, Best Value: 13.096347, Empirical Value: 11.661965
val Loss: 1.024721, Best Value: 13.258913, Empirical Value: 11.829538
----------
Epoch 274/299
----------
train Loss: 0.484141, Best Value: 13.086452, Empirical Value: 11.657899
val Loss: 1.049084, Best Value: 13.312047, Empirical Value: 11.883581
Best Value updated
----------
Epoch 275/299
----------
train Loss: 0.479152, Best Value: 13.096515, Empirical Value: 11.655282
val Loss: 1.038518, Best Value: 13.305832, Empirical Value: 11.909951
----------
Epoch 276/299
----------
train Loss: 0.476290, Best Value: 13.108779, Empirical Value: 11.651927
val Loss: 1.029690, Best Value: 13.262105, Empirical Value: 11.824263
----------
Epoch 277/299
----------
train Loss: 0.470050, Best Value: 13.098767, Empirical Value: 11.645580
val Loss: 1.034605, Best Value: 13.342193, Empirical Value: 11.929651
Best Value updated
----------
Epoch 278/299
----------
train Loss: 0.465227, Best Value: 13.105932, Empirical Value: 11.642481


val Loss: 1.229756, Best Value: 1.553687, Empirical Value: 1.107399
Best Value updated
----------
Epoch 17/299
----------
train Loss: 1.253546, Best Value: 1.562415, Empirical Value: 1.117096
val Loss: 1.230954, Best Value: 1.550128, Empirical Value: 1.095904
----------
Epoch 18/299
----------
train Loss: 1.253449, Best Value: 1.568672, Empirical Value: 1.116450
val Loss: 1.230331, Best Value: 1.570509, Empirical Value: 1.115815
Best Value updated
----------
Epoch 19/299
----------
train Loss: 1.253244, Best Value: 1.572159, Empirical Value: 1.115112
val Loss: 1.230753, Best Value: 1.533604, Empirical Value: 1.100079
----------
Epoch 20/299
----------
Updating Target Model
train Loss: 1.252738, Best Value: 1.575037, Empirical Value: 1.113673
val Loss: 1.273857, Best Value: 1.543168, Empirical Value: 1.096064
----------
Epoch 21/299
----------
train Loss: 1.238379, Best Value: 1.816354, Empirical Value: 1.442432
val Loss: 1.212772, Best Value: 1.834314, Empirical Value: 1.458521
Best Va

train Loss: 1.169941, Best Value: 2.926943, Empirical Value: 2.531147
val Loss: 1.149492, Best Value: 2.971187, Empirical Value: 2.560237
Best Value updated
----------
Epoch 62/299
----------
train Loss: 1.167220, Best Value: 2.955450, Empirical Value: 2.533833
val Loss: 1.148923, Best Value: 2.959056, Empirical Value: 2.528426
----------
Epoch 63/299
----------
train Loss: 1.166811, Best Value: 2.971602, Empirical Value: 2.535038
val Loss: 1.148775, Best Value: 2.957757, Empirical Value: 2.526192
----------
Epoch 64/299
----------
train Loss: 1.165836, Best Value: 2.981678, Empirical Value: 2.537444
val Loss: 1.148266, Best Value: 2.994652, Empirical Value: 2.546487
Best Value updated
----------
Epoch 65/299
----------
train Loss: 1.165779, Best Value: 2.989148, Empirical Value: 2.535765
val Loss: 1.148639, Best Value: 3.040531, Empirical Value: 2.580064
Best Value updated
----------
Epoch 66/299
----------
train Loss: 1.165466, Best Value: 2.996597, Empirical Value: 2.536320
val Loss

val Loss: 1.112908, Best Value: 4.065458, Empirical Value: 3.508227
----------
Epoch 106/299
----------
train Loss: 1.127882, Best Value: 4.073380, Empirical Value: 3.489599
val Loss: 1.112805, Best Value: 4.122857, Empirical Value: 3.504667
Best Value updated
----------
Epoch 107/299
----------
train Loss: 1.127278, Best Value: 4.082222, Empirical Value: 3.488895
val Loss: 1.112796, Best Value: 4.090084, Empirical Value: 3.498930
----------
Epoch 108/299
----------
train Loss: 1.126996, Best Value: 4.095668, Empirical Value: 3.489831
val Loss: 1.113836, Best Value: 4.130777, Empirical Value: 3.526338
Best Value updated
----------
Epoch 109/299
----------
train Loss: 1.127001, Best Value: 4.096230, Empirical Value: 3.489342
val Loss: 1.112395, Best Value: 4.143578, Empirical Value: 3.531793
Best Value updated
----------
Epoch 110/299
----------
Updating Target Model
train Loss: 1.126566, Best Value: 4.105981, Empirical Value: 3.490973
val Loss: 1.149409, Best Value: 4.161752, Empirical

val Loss: 1.071703, Best Value: 4.887846, Empirical Value: 4.318117
Best Value updated
----------
Epoch 151/299
----------
train Loss: 1.075107, Best Value: 4.933331, Empirical Value: 4.423050
val Loss: 1.074552, Best Value: 4.880378, Empirical Value: 4.406703
----------
Epoch 152/299
----------
train Loss: 1.074978, Best Value: 4.944493, Empirical Value: 4.423917
val Loss: 1.061700, Best Value: 4.986529, Empirical Value: 4.453098
Best Value updated
----------
Epoch 153/299
----------
train Loss: 1.073361, Best Value: 4.951777, Empirical Value: 4.424253
val Loss: 1.062217, Best Value: 4.999933, Empirical Value: 4.458196
Best Value updated
----------
Epoch 154/299
----------
train Loss: 1.073516, Best Value: 4.966347, Empirical Value: 4.426867
val Loss: 1.064739, Best Value: 5.067574, Empirical Value: 4.502106
Best Value updated
----------
Epoch 155/299
----------
train Loss: 1.074043, Best Value: 4.960626, Empirical Value: 4.420721
val Loss: 1.064919, Best Value: 4.959803, Empirical Va

val Loss: 1.036600, Best Value: 5.444355, Empirical Value: 4.864874
----------
Epoch 196/299
----------
train Loss: 1.042190, Best Value: 5.440313, Empirical Value: 4.852633
val Loss: 1.035572, Best Value: 5.504126, Empirical Value: 4.928857
Best Value updated
----------
Epoch 197/299
----------
train Loss: 1.043265, Best Value: 5.451037, Empirical Value: 4.853078
val Loss: 1.037584, Best Value: 5.523688, Empirical Value: 4.930078
Best Value updated
----------
Epoch 198/299
----------
train Loss: 1.041398, Best Value: 5.449178, Empirical Value: 4.853740
val Loss: 1.035815, Best Value: 5.565237, Empirical Value: 4.923870
Best Value updated
----------
Epoch 199/299
----------
train Loss: 1.042356, Best Value: 5.451137, Empirical Value: 4.850065
val Loss: 1.034992, Best Value: 5.494090, Empirical Value: 4.897699
----------
Epoch 200/299
----------
Updating Target Model
train Loss: 1.041959, Best Value: 5.452433, Empirical Value: 4.852231
val Loss: 1.036486, Best Value: 5.518955, Empirical

Updating Target Model
train Loss: 1.022588, Best Value: 5.927881, Empirical Value: 5.283942
val Loss: 1.026189, Best Value: 5.947410, Empirical Value: 5.290565
----------
Epoch 241/299
----------
train Loss: 1.023857, Best Value: 5.988666, Empirical Value: 5.369688
val Loss: 1.035948, Best Value: 5.983086, Empirical Value: 5.381427
----------
Epoch 242/299
----------
train Loss: 1.023561, Best Value: 5.991534, Empirical Value: 5.369452
val Loss: 1.020342, Best Value: 6.049204, Empirical Value: 5.423270
Best Value updated
----------
Epoch 243/299
----------
train Loss: 1.024949, Best Value: 5.999244, Empirical Value: 5.366849
val Loss: 1.018538, Best Value: 6.078789, Empirical Value: 5.431970
Best Value updated
----------
Epoch 244/299
----------
train Loss: 1.023509, Best Value: 6.004511, Empirical Value: 5.367482
val Loss: 1.019730, Best Value: 6.037837, Empirical Value: 5.387829
----------
Epoch 245/299
----------
train Loss: 1.022849, Best Value: 6.009985, Empirical Value: 5.367430


val Loss: 1.019821, Best Value: 6.398442, Empirical Value: 5.690490
----------
Epoch 286/299
----------
train Loss: 1.015641, Best Value: 6.361378, Empirical Value: 5.637848
val Loss: 1.019915, Best Value: 6.396639, Empirical Value: 5.678242
----------
Epoch 287/299
----------
train Loss: 1.014952, Best Value: 6.360205, Empirical Value: 5.637222
val Loss: 1.016681, Best Value: 6.345894, Empirical Value: 5.637916
----------
Epoch 288/299
----------
train Loss: 1.014673, Best Value: 6.363408, Empirical Value: 5.638459
val Loss: 1.015866, Best Value: 6.414720, Empirical Value: 5.693490
Best Value updated
----------
Epoch 289/299
----------
train Loss: 1.015023, Best Value: 6.369048, Empirical Value: 5.636861
val Loss: 1.019286, Best Value: 6.373971, Empirical Value: 5.678433
----------
Epoch 290/299
----------
Updating Target Model
train Loss: 1.014031, Best Value: 6.369102, Empirical Value: 5.639092
val Loss: 1.026414, Best Value: 6.386846, Empirical Value: 5.658378
----------
Epoch 291/

train Loss: 1.239043, Best Value: 2.617609, Empirical Value: 1.848462
val Loss: 1.228673, Best Value: 2.660798, Empirical Value: 1.877639
Best Value updated
----------
Epoch 29/299
----------
train Loss: 1.238955, Best Value: 2.624841, Empirical Value: 1.847481
val Loss: 1.228951, Best Value: 2.600591, Empirical Value: 1.825402
----------
Epoch 30/299
----------
Updating Target Model
train Loss: 1.239236, Best Value: 2.630423, Empirical Value: 1.845435
val Loss: 1.388840, Best Value: 2.672207, Empirical Value: 1.866444
Best Value updated
----------
Epoch 31/299
----------
train Loss: 1.241587, Best Value: 3.045625, Empirical Value: 2.419438
val Loss: 1.227468, Best Value: 3.076381, Empirical Value: 2.436965
Best Value updated
----------
Epoch 32/299
----------
train Loss: 1.231065, Best Value: 3.105784, Empirical Value: 2.442314
val Loss: 1.227460, Best Value: 3.084574, Empirical Value: 2.412248
Best Value updated
----------
Epoch 33/299
----------
train Loss: 1.229752, Best Value: 3.1

val Loss: 1.142260, Best Value: 4.544094, Empirical Value: 3.963996
Best Value updated
----------
Epoch 73/299
----------
train Loss: 1.133195, Best Value: 4.520476, Empirical Value: 3.932956
val Loss: 1.139584, Best Value: 4.516219, Empirical Value: 3.919721
----------
Epoch 74/299
----------
train Loss: 1.132270, Best Value: 4.538716, Empirical Value: 3.933750
val Loss: 1.140683, Best Value: 4.618295, Empirical Value: 4.019308
Best Value updated
----------
Epoch 75/299
----------
train Loss: 1.131609, Best Value: 4.540818, Empirical Value: 3.930667
val Loss: 1.142751, Best Value: 4.576055, Empirical Value: 3.947023
----------
Epoch 76/299
----------
train Loss: 1.130846, Best Value: 4.553399, Empirical Value: 3.932904
val Loss: 1.142164, Best Value: 4.554439, Empirical Value: 3.913535
----------
Epoch 77/299
----------
train Loss: 1.129973, Best Value: 4.549805, Empirical Value: 3.931948
val Loss: 1.145051, Best Value: 4.551115, Empirical Value: 3.915434
----------
Epoch 78/299
-----

train Loss: 1.047709, Best Value: 5.525426, Empirical Value: 4.801921
val Loss: 1.069388, Best Value: 5.605042, Empirical Value: 4.888618
Best Value updated
----------
Epoch 118/299
----------
train Loss: 1.047936, Best Value: 5.523247, Empirical Value: 4.802048
val Loss: 1.069488, Best Value: 5.533404, Empirical Value: 4.809192
----------
Epoch 119/299
----------
train Loss: 1.047292, Best Value: 5.534782, Empirical Value: 4.803994
val Loss: 1.068311, Best Value: 5.566980, Empirical Value: 4.823194
----------
Epoch 120/299
----------
Updating Target Model
train Loss: 1.046497, Best Value: 5.540263, Empirical Value: 4.800151
val Loss: 1.084669, Best Value: 5.491493, Empirical Value: 4.745087
----------
Epoch 121/299
----------
train Loss: 1.034875, Best Value: 5.661542, Empirical Value: 4.961796
val Loss: 1.058867, Best Value: 5.725464, Empirical Value: 5.023302
Best Value updated
----------
Epoch 122/299
----------
train Loss: 1.034196, Best Value: 5.680756, Empirical Value: 4.960667


val Loss: 1.013898, Best Value: 6.971826, Empirical Value: 6.082626
Best Value updated
----------
Epoch 162/299
----------
train Loss: 0.978903, Best Value: 6.952895, Empirical Value: 6.077777
val Loss: 1.026137, Best Value: 6.908539, Empirical Value: 6.022866
----------
Epoch 163/299
----------
train Loss: 0.979428, Best Value: 6.966912, Empirical Value: 6.074617
val Loss: 1.015728, Best Value: 6.998141, Empirical Value: 6.104074
Best Value updated
----------
Epoch 164/299
----------
train Loss: 0.976701, Best Value: 6.994067, Empirical Value: 6.079280
val Loss: 1.020389, Best Value: 7.032665, Empirical Value: 6.090638
Best Value updated
----------
Epoch 165/299
----------
train Loss: 0.978414, Best Value: 6.997555, Empirical Value: 6.071856
val Loss: 1.018205, Best Value: 7.096318, Empirical Value: 6.145227
Best Value updated
----------
Epoch 166/299
----------
train Loss: 0.976147, Best Value: 7.017075, Empirical Value: 6.078542
val Loss: 1.017566, Best Value: 7.070056, Empirical Va

train Loss: 0.927249, Best Value: 8.499992, Empirical Value: 7.338223
val Loss: 0.994652, Best Value: 8.518088, Empirical Value: 7.330545
----------
Epoch 207/299
----------
train Loss: 0.926719, Best Value: 8.493296, Empirical Value: 7.331682
val Loss: 0.996996, Best Value: 8.508231, Empirical Value: 7.338020
----------
Epoch 208/299
----------
train Loss: 0.925351, Best Value: 8.516995, Empirical Value: 7.333456
val Loss: 0.999577, Best Value: 8.543252, Empirical Value: 7.398487
----------
Epoch 209/299
----------
train Loss: 0.926147, Best Value: 8.516235, Empirical Value: 7.333961
val Loss: 1.053741, Best Value: 8.290591, Empirical Value: 7.122186
----------
Epoch 210/299
----------
Updating Target Model
train Loss: 0.925116, Best Value: 8.522233, Empirical Value: 7.334416
val Loss: 1.060836, Best Value: 8.537537, Empirical Value: 7.330025
----------
Epoch 211/299
----------
train Loss: 0.933737, Best Value: 8.770213, Empirical Value: 7.671404
val Loss: 1.000545, Best Value: 8.7821

Updating Target Model
train Loss: 0.896711, Best Value: 10.117628, Empirical Value: 8.727539
val Loss: 1.049005, Best Value: 10.199835, Empirical Value: 8.794153
----------
Epoch 251/299
----------
train Loss: 0.905824, Best Value: 10.415257, Empirical Value: 9.137895
val Loss: 1.005091, Best Value: 10.463546, Empirical Value: 9.133009
Best Value updated
----------
Epoch 252/299
----------
train Loss: 0.902264, Best Value: 10.483933, Empirical Value: 9.137450
val Loss: 0.993153, Best Value: 10.445758, Empirical Value: 9.192265
----------
Epoch 253/299
----------
train Loss: 0.899187, Best Value: 10.507145, Empirical Value: 9.143212
val Loss: 0.992129, Best Value: 10.608678, Empirical Value: 9.272001
Best Value updated
----------
Epoch 254/299
----------
train Loss: 0.900841, Best Value: 10.527090, Empirical Value: 9.141604
val Loss: 1.052611, Best Value: 10.438080, Empirical Value: 8.986476
----------
Epoch 255/299
----------
train Loss: 0.896805, Best Value: 10.536206, Empirical Value

val Loss: 0.993066, Best Value: 12.281963, Empirical Value: 10.671992
Best Value updated
----------
Epoch 295/299
----------
train Loss: 0.870485, Best Value: 12.209745, Empirical Value: 10.577024
val Loss: 0.988516, Best Value: 12.245142, Empirical Value: 10.648693
----------
Epoch 296/299
----------
train Loss: 0.873861, Best Value: 12.223860, Empirical Value: 10.575579
val Loss: 0.985141, Best Value: 12.327169, Empirical Value: 10.666055
Best Value updated
----------
Epoch 297/299
----------
train Loss: 0.869787, Best Value: 12.249372, Empirical Value: 10.575770
val Loss: 0.998251, Best Value: 12.380519, Empirical Value: 10.688444
Best Value updated
----------
Epoch 298/299
----------
train Loss: 0.872060, Best Value: 12.254207, Empirical Value: 10.574673
val Loss: 0.980717, Best Value: 12.276097, Empirical Value: 10.652198
----------
Epoch 299/299
----------
train Loss: 0.867815, Best Value: 12.258120, Empirical Value: 10.575788
val Loss: 1.005510, Best Value: 12.205263, Empirical 

train Loss: 1.203372, Best Value: 2.988914, Empirical Value: 2.294788
val Loss: 1.209046, Best Value: 2.990635, Empirical Value: 2.290476
----------
Epoch 38/299
----------
train Loss: 1.203358, Best Value: 3.005722, Empirical Value: 2.291776
val Loss: 1.208359, Best Value: 2.995331, Empirical Value: 2.289275
----------
Epoch 39/299
----------
train Loss: 1.201975, Best Value: 3.007297, Empirical Value: 2.292107
val Loss: 1.214030, Best Value: 2.917704, Empirical Value: 2.231190
----------
Epoch 40/299
----------
Updating Target Model
train Loss: 1.203626, Best Value: 3.013526, Empirical Value: 2.282402
val Loss: 1.282840, Best Value: 3.024731, Empirical Value: 2.320992
Best Value updated
----------
Epoch 41/299
----------
train Loss: 1.186143, Best Value: 3.314350, Empirical Value: 2.713211
val Loss: 1.187836, Best Value: 3.346443, Empirical Value: 2.749078
Best Value updated
----------
Epoch 42/299
----------
train Loss: 1.183217, Best Value: 3.342108, Empirical Value: 2.713027
val L

val Loss: 1.132764, Best Value: 5.216652, Empirical Value: 4.403861
Best Value updated
----------
Epoch 82/299
----------
train Loss: 1.091939, Best Value: 5.306187, Empirical Value: 4.438161
val Loss: 1.135051, Best Value: 5.352892, Empirical Value: 4.439864
Best Value updated
----------
Epoch 83/299
----------
train Loss: 1.088047, Best Value: 5.348645, Empirical Value: 4.432726
val Loss: 1.128324, Best Value: 5.342915, Empirical Value: 4.426675
----------
Epoch 84/299
----------
train Loss: 1.085249, Best Value: 5.366581, Empirical Value: 4.434660
val Loss: 1.128188, Best Value: 5.417860, Empirical Value: 4.459839
Best Value updated
----------
Epoch 85/299
----------
train Loss: 1.082292, Best Value: 5.396267, Empirical Value: 4.438882
val Loss: 1.130614, Best Value: 5.379759, Empirical Value: 4.433288
----------
Epoch 86/299
----------
train Loss: 1.082786, Best Value: 5.406155, Empirical Value: 4.433402
val Loss: 1.133094, Best Value: 5.402198, Empirical Value: 4.442020
----------

val Loss: 1.109341, Best Value: 8.100332, Empirical Value: 6.706303
----------
Epoch 126/299
----------
train Loss: 0.994467, Best Value: 8.126328, Empirical Value: 6.698970
val Loss: 1.110608, Best Value: 8.145448, Empirical Value: 6.707937
Best Value updated
----------
Epoch 127/299
----------
train Loss: 0.993591, Best Value: 8.143899, Empirical Value: 6.703578
val Loss: 1.110020, Best Value: 8.164737, Empirical Value: 6.717726
Best Value updated
----------
Epoch 128/299
----------
train Loss: 0.992721, Best Value: 8.160867, Empirical Value: 6.702601
val Loss: 1.120723, Best Value: 8.191379, Empirical Value: 6.697606
Best Value updated
----------
Epoch 129/299
----------
train Loss: 0.992035, Best Value: 8.173823, Empirical Value: 6.694963
val Loss: 1.111739, Best Value: 8.177314, Empirical Value: 6.707557
----------
Epoch 130/299
----------
Updating Target Model
train Loss: 0.990672, Best Value: 8.185864, Empirical Value: 6.694606
val Loss: 1.296768, Best Value: 8.199488, Empirical

val Loss: 1.123243, Best Value: 10.449840, Empirical Value: 8.958462
----------
Epoch 170/299
----------
Updating Target Model
train Loss: 0.868817, Best Value: 10.566596, Empirical Value: 9.015960
val Loss: 1.117952, Best Value: 10.628429, Empirical Value: 9.055378
Best Value updated
----------
Epoch 171/299
----------
train Loss: 0.884327, Best Value: 10.833658, Empirical Value: 9.390035
val Loss: 1.050253, Best Value: 10.887254, Empirical Value: 9.455804
Best Value updated
----------
Epoch 172/299
----------
train Loss: 0.877977, Best Value: 10.843811, Empirical Value: 9.370408
val Loss: 1.061592, Best Value: 10.864338, Empirical Value: 9.363375
----------
Epoch 173/299
----------
train Loss: 0.876407, Best Value: 10.841997, Empirical Value: 9.358988
val Loss: 1.060070, Best Value: 10.947833, Empirical Value: 9.451528
Best Value updated
----------
Epoch 174/299
----------
train Loss: 0.869729, Best Value: 10.864473, Empirical Value: 9.361773
val Loss: 1.064582, Best Value: 10.927504

val Loss: 0.983391, Best Value: 12.545809, Empirical Value: 11.006003
Best Value updated
----------
Epoch 214/299
----------
train Loss: 0.753603, Best Value: 12.438966, Empirical Value: 10.889496
val Loss: 0.976067, Best Value: 12.508368, Empirical Value: 10.963319
----------
Epoch 215/299
----------
train Loss: 0.751073, Best Value: 12.440481, Empirical Value: 10.890917
val Loss: 0.980215, Best Value: 12.528790, Empirical Value: 10.950207
----------
Epoch 216/299
----------
train Loss: 0.749231, Best Value: 12.447977, Empirical Value: 10.887342
val Loss: 0.991569, Best Value: 12.514133, Empirical Value: 10.926615
----------
Epoch 217/299
----------
train Loss: 0.744784, Best Value: 12.455282, Empirical Value: 10.893444
val Loss: 0.974810, Best Value: 12.618553, Empirical Value: 11.019821
Best Value updated
----------
Epoch 218/299
----------
train Loss: 0.742322, Best Value: 12.468829, Empirical Value: 10.884233
val Loss: 0.985226, Best Value: 12.603639, Empirical Value: 10.973918
--

train Loss: 0.659813, Best Value: 13.465783, Empirical Value: 11.850992
val Loss: 0.933531, Best Value: 13.578702, Empirical Value: 12.015672
----------
Epoch 259/299
----------
train Loss: 0.657520, Best Value: 13.463177, Empirical Value: 11.847248
val Loss: 0.934760, Best Value: 13.526084, Empirical Value: 11.933107
----------
Epoch 260/299
----------
Updating Target Model
train Loss: 0.656558, Best Value: 13.476594, Empirical Value: 11.847827
val Loss: 0.917204, Best Value: 13.439441, Empirical Value: 11.793829
----------
Epoch 261/299
----------
train Loss: 0.666655, Best Value: 13.576725, Empirical Value: 11.996845
val Loss: 0.920928, Best Value: 13.697357, Empirical Value: 12.103040
Best Value updated
----------
Epoch 262/299
----------
train Loss: 0.664219, Best Value: 13.571136, Empirical Value: 11.980592
val Loss: 0.920760, Best Value: 13.727559, Empirical Value: 12.100046
Best Value updated
----------
Epoch 263/299
----------
train Loss: 0.659828, Best Value: 13.589411, Empir

train Loss: 1.305350, Best Value: 1.256690, Empirical Value: 0.679733
val Loss: 1.263812, Best Value: 1.308341, Empirical Value: 0.709832
Best Value updated
----------
Epoch 2/299
----------
train Loss: 1.287947, Best Value: 1.347433, Empirical Value: 0.710619
val Loss: 1.262830, Best Value: 1.351384, Empirical Value: 0.696175
Best Value updated
----------
Epoch 3/299
----------
train Loss: 1.285577, Best Value: 1.394083, Empirical Value: 0.709157
val Loss: 1.260157, Best Value: 1.395048, Empirical Value: 0.717075
Best Value updated
----------
Epoch 4/299
----------
train Loss: 1.283905, Best Value: 1.414362, Empirical Value: 0.701165
val Loss: 1.261521, Best Value: 1.424709, Empirical Value: 0.696485
Best Value updated
----------
Epoch 5/299
----------
train Loss: 1.282541, Best Value: 1.442914, Empirical Value: 0.699577
val Loss: 1.260406, Best Value: 1.448656, Empirical Value: 0.679916
Best Value updated
----------
Epoch 6/299
----------
train Loss: 1.283664, Best Value: 1.444718, E

train Loss: 1.201812, Best Value: 3.898266, Empirical Value: 3.059065
val Loss: 1.240101, Best Value: 3.877296, Empirical Value: 3.063610
----------
Epoch 46/299
----------
train Loss: 1.199264, Best Value: 3.915250, Empirical Value: 3.051953
val Loss: 1.248053, Best Value: 3.958397, Empirical Value: 3.106609
Best Value updated
----------
Epoch 47/299
----------
train Loss: 1.197057, Best Value: 3.923950, Empirical Value: 3.046357
val Loss: 1.250790, Best Value: 3.925671, Empirical Value: 3.021205
----------
Epoch 48/299
----------
train Loss: 1.197981, Best Value: 3.946092, Empirical Value: 3.043282
val Loss: 1.264974, Best Value: 3.962426, Empirical Value: 3.086877
Best Value updated
----------
Epoch 49/299
----------
train Loss: 1.196776, Best Value: 3.970970, Empirical Value: 3.036085
val Loss: 1.251148, Best Value: 3.942597, Empirical Value: 3.032633
----------
Epoch 50/299
----------
Updating Target Model
train Loss: 1.194782, Best Value: 3.979145, Empirical Value: 3.031504
val L

train Loss: 1.066539, Best Value: 7.037558, Empirical Value: 5.518592
val Loss: 1.231188, Best Value: 6.934384, Empirical Value: 5.475190
----------
Epoch 90/299
----------
Updating Target Model
train Loss: 1.061565, Best Value: 7.061182, Empirical Value: 5.528645
val Loss: 1.459922, Best Value: 6.936128, Empirical Value: 5.437170
----------
Epoch 91/299
----------
train Loss: 1.077711, Best Value: 7.587975, Empirical Value: 6.189221
val Loss: 1.223739, Best Value: 7.531294, Empirical Value: 6.143530
Best Value updated
----------
Epoch 92/299
----------
train Loss: 1.065224, Best Value: 7.650500, Empirical Value: 6.192008
val Loss: 1.231671, Best Value: 7.684877, Empirical Value: 6.233195
Best Value updated
----------
Epoch 93/299
----------
train Loss: 1.061172, Best Value: 7.669086, Empirical Value: 6.182062
val Loss: 1.225219, Best Value: 7.748333, Empirical Value: 6.230032
Best Value updated
----------
Epoch 94/299
----------
train Loss: 1.051500, Best Value: 7.704271, Empirical Va

val Loss: 1.129104, Best Value: 10.502660, Empirical Value: 9.014583
Best Value updated
----------
Epoch 134/299
----------
train Loss: 0.879521, Best Value: 10.408076, Empirical Value: 8.883422
val Loss: 1.158520, Best Value: 10.549510, Empirical Value: 9.043894
Best Value updated
----------
Epoch 135/299
----------
train Loss: 0.876385, Best Value: 10.418116, Empirical Value: 8.876461
val Loss: 1.144302, Best Value: 10.666347, Empirical Value: 9.116377
Best Value updated
----------
Epoch 136/299
----------
train Loss: 0.870937, Best Value: 10.422513, Empirical Value: 8.872961
val Loss: 1.146591, Best Value: 10.472909, Empirical Value: 8.970120
----------
Epoch 137/299
----------
train Loss: 0.871067, Best Value: 10.420066, Empirical Value: 8.872350
val Loss: 1.155532, Best Value: 10.623042, Empirical Value: 9.056251
----------
Epoch 138/299
----------
train Loss: 0.864143, Best Value: 10.426386, Empirical Value: 8.870231
val Loss: 1.156541, Best Value: 10.588780, Empirical Value: 9.0

train Loss: 0.702297, Best Value: 11.934621, Empirical Value: 10.416260
val Loss: 1.068922, Best Value: 12.019046, Empirical Value: 10.539837
----------
Epoch 179/299
----------
train Loss: 0.697511, Best Value: 11.954642, Empirical Value: 10.418915
val Loss: 1.064089, Best Value: 12.053842, Empirical Value: 10.538084
----------
Epoch 180/299
----------
Updating Target Model
train Loss: 0.697268, Best Value: 11.952689, Empirical Value: 10.414547
val Loss: 0.999132, Best Value: 12.093861, Empirical Value: 10.616260
----------
Epoch 181/299
----------
train Loss: 0.698920, Best Value: 12.201473, Empirical Value: 10.763209
val Loss: 1.031907, Best Value: 12.385026, Empirical Value: 10.972789
Best Value updated
----------
Epoch 182/299
----------
train Loss: 0.690389, Best Value: 12.189770, Empirical Value: 10.744610
val Loss: 1.032164, Best Value: 12.358656, Empirical Value: 10.939902
----------
Epoch 183/299
----------
train Loss: 0.683019, Best Value: 12.216834, Empirical Value: 10.7447

train Loss: 0.582649, Best Value: 13.185250, Empirical Value: 11.714702
val Loss: 0.988342, Best Value: 13.334469, Empirical Value: 11.890042
Best Value updated
----------
Epoch 223/299
----------
train Loss: 0.575114, Best Value: 13.198456, Empirical Value: 11.713646
val Loss: 0.978675, Best Value: 13.306780, Empirical Value: 11.810777
----------
Epoch 224/299
----------
train Loss: 0.569622, Best Value: 13.200708, Empirical Value: 11.707261
val Loss: 0.980091, Best Value: 13.253908, Empirical Value: 11.804199
----------
Epoch 225/299
----------
train Loss: 0.566521, Best Value: 13.202159, Empirical Value: 11.710798
val Loss: 0.979765, Best Value: 13.314665, Empirical Value: 11.820368
----------
Epoch 226/299
----------
train Loss: 0.561882, Best Value: 13.209894, Empirical Value: 11.703042
val Loss: 0.990591, Best Value: 13.259864, Empirical Value: 11.759111
----------
Epoch 227/299
----------
train Loss: 0.563734, Best Value: 13.211754, Empirical Value: 11.698544
val Loss: 0.990622,

val Loss: 0.978609, Best Value: 13.870789, Empirical Value: 12.263913
----------
Epoch 267/299
----------
train Loss: 0.503746, Best Value: 13.828271, Empirical Value: 12.205759
val Loss: 0.981222, Best Value: 13.964108, Empirical Value: 12.364658
----------
Epoch 268/299
----------
train Loss: 0.499659, Best Value: 13.820653, Empirical Value: 12.201027
val Loss: 0.989501, Best Value: 13.907606, Empirical Value: 12.267066
----------
Epoch 269/299
----------
train Loss: 0.503024, Best Value: 13.830433, Empirical Value: 12.200907
val Loss: 0.992448, Best Value: 13.971019, Empirical Value: 12.391191
Best Value updated
----------
Epoch 270/299
----------
Updating Target Model
train Loss: 0.495876, Best Value: 13.834626, Empirical Value: 12.201741
val Loss: 0.933389, Best Value: 13.882467, Empirical Value: 12.272473
----------
Epoch 271/299
----------
train Loss: 0.524760, Best Value: 13.953239, Empirical Value: 12.372509
val Loss: 0.963530, Best Value: 13.994421, Empirical Value: 12.419102

val Loss: 1.260505, Best Value: 1.657639, Empirical Value: 0.771497
Best Value updated
----------
Epoch 10/299
----------
Updating Target Model
train Loss: 1.274973, Best Value: 1.630290, Empirical Value: 0.773201
val Loss: 1.532688, Best Value: 1.665013, Empirical Value: 0.785904
Best Value updated
----------
Epoch 11/299
----------
train Loss: 1.279068, Best Value: 2.180538, Empirical Value: 1.455123
val Loss: 1.249275, Best Value: 2.211004, Empirical Value: 1.495503
Best Value updated
----------
Epoch 12/299
----------
train Loss: 1.256484, Best Value: 2.225029, Empirical Value: 1.487811
val Loss: 1.235657, Best Value: 2.265472, Empirical Value: 1.514607
Best Value updated
----------
Epoch 13/299
----------
train Loss: 1.256438, Best Value: 2.262303, Empirical Value: 1.495703
val Loss: 1.235755, Best Value: 2.269379, Empirical Value: 1.495432
Best Value updated
----------
Epoch 14/299
----------
train Loss: 1.251091, Best Value: 2.268902, Empirical Value: 1.496013
val Loss: 1.248139

val Loss: 1.236833, Best Value: 4.757122, Empirical Value: 3.667677
Best Value updated
----------
Epoch 54/299
----------
train Loss: 1.172386, Best Value: 4.664266, Empirical Value: 3.552196
val Loss: 1.236397, Best Value: 4.756233, Empirical Value: 3.645634
----------
Epoch 55/299
----------
train Loss: 1.167125, Best Value: 4.693006, Empirical Value: 3.554840
val Loss: 1.245720, Best Value: 4.660227, Empirical Value: 3.559227
----------
Epoch 56/299
----------
train Loss: 1.160513, Best Value: 4.730755, Empirical Value: 3.561500
val Loss: 1.242030, Best Value: 4.873288, Empirical Value: 3.691315
Best Value updated
----------
Epoch 57/299
----------
train Loss: 1.159690, Best Value: 4.774351, Empirical Value: 3.556135
val Loss: 1.235354, Best Value: 4.910566, Empirical Value: 3.684806
Best Value updated
----------
Epoch 58/299
----------
train Loss: 1.156173, Best Value: 4.789667, Empirical Value: 3.556639
val Loss: 1.255196, Best Value: 5.019271, Empirical Value: 3.752126
Best Value

train Loss: 1.106507, Best Value: 7.979170, Empirical Value: 6.484459
val Loss: 1.392077, Best Value: 8.170077, Empirical Value: 6.645869
Best Value updated
----------
Epoch 99/299
----------
train Loss: 1.098745, Best Value: 8.027243, Empirical Value: 6.494496
val Loss: 1.384751, Best Value: 8.221518, Empirical Value: 6.672271
Best Value updated
----------
Epoch 100/299
----------
Updating Target Model
train Loss: 1.093239, Best Value: 8.056341, Empirical Value: 6.490489
val Loss: 1.490904, Best Value: 7.985790, Empirical Value: 6.464639
----------
Epoch 101/299
----------
train Loss: 1.105499, Best Value: 8.482580, Empirical Value: 7.089571
val Loss: 1.339556, Best Value: 8.334835, Empirical Value: 7.062846
Best Value updated
----------
Epoch 102/299
----------
train Loss: 1.083374, Best Value: 8.481068, Empirical Value: 7.084648
val Loss: 1.334912, Best Value: 8.502725, Empirical Value: 7.121317
Best Value updated
----------
Epoch 103/299
----------
train Loss: 1.072980, Best Value:

val Loss: 1.241856, Best Value: 10.575201, Empirical Value: 9.232054
----------
Epoch 143/299
----------
train Loss: 0.856047, Best Value: 10.608517, Empirical Value: 9.192160
val Loss: 1.245443, Best Value: 10.706993, Empirical Value: 9.294292
Best Value updated
----------
Epoch 144/299
----------
train Loss: 0.848068, Best Value: 10.632434, Empirical Value: 9.195706
val Loss: 1.243234, Best Value: 10.774333, Empirical Value: 9.376690
Best Value updated
----------
Epoch 145/299
----------
train Loss: 0.840333, Best Value: 10.650671, Empirical Value: 9.189942
val Loss: 1.256944, Best Value: 10.894953, Empirical Value: 9.454614
Best Value updated
----------
Epoch 146/299
----------
train Loss: 0.829443, Best Value: 10.668416, Empirical Value: 9.195115
val Loss: 1.242252, Best Value: 10.772969, Empirical Value: 9.324437
----------
Epoch 147/299
----------
train Loss: 0.824328, Best Value: 10.686129, Empirical Value: 9.195869
val Loss: 1.269319, Best Value: 10.717735, Empirical Value: 9.2

train Loss: 0.647590, Best Value: 11.974423, Empirical Value: 10.557039
val Loss: 1.155527, Best Value: 12.186605, Empirical Value: 10.812802
----------
Epoch 187/299
----------
train Loss: 0.640233, Best Value: 11.988924, Empirical Value: 10.557266
val Loss: 1.133189, Best Value: 12.150458, Empirical Value: 10.714350
----------
Epoch 188/299
----------
train Loss: 0.635602, Best Value: 11.995973, Empirical Value: 10.557316
val Loss: 1.141241, Best Value: 12.194061, Empirical Value: 10.766515
Best Value updated
----------
Epoch 189/299
----------
train Loss: 0.637456, Best Value: 12.016072, Empirical Value: 10.554248
val Loss: 1.150515, Best Value: 12.076676, Empirical Value: 10.625060
----------
Epoch 190/299
----------
Updating Target Model
train Loss: 0.630310, Best Value: 12.010098, Empirical Value: 10.549776
val Loss: 1.055920, Best Value: 12.052494, Empirical Value: 10.584163
----------
Epoch 191/299
----------
train Loss: 0.647071, Best Value: 12.117669, Empirical Value: 10.7302

Updating Target Model
train Loss: 0.508518, Best Value: 12.703627, Empirical Value: 11.235214
val Loss: 0.926643, Best Value: 12.755560, Empirical Value: 11.324208
----------
Epoch 231/299
----------
train Loss: 0.529794, Best Value: 12.775895, Empirical Value: 11.347148
val Loss: 1.001425, Best Value: 12.952036, Empirical Value: 11.533409
Best Value updated
----------
Epoch 232/299
----------
train Loss: 0.517797, Best Value: 12.762984, Empirical Value: 11.312075
val Loss: 0.993922, Best Value: 12.808055, Empirical Value: 11.385541
----------
Epoch 233/299
----------
train Loss: 0.511881, Best Value: 12.764764, Empirical Value: 11.302538
val Loss: 1.004457, Best Value: 12.815074, Empirical Value: 11.373426
----------
Epoch 234/299
----------
train Loss: 0.504442, Best Value: 12.756760, Empirical Value: 11.295944
val Loss: 1.016108, Best Value: 12.848932, Empirical Value: 11.404461
----------
Epoch 235/299
----------
train Loss: 0.498390, Best Value: 12.768552, Empirical Value: 11.2981

train Loss: 0.427684, Best Value: 13.046416, Empirical Value: 11.601666
val Loss: 0.998975, Best Value: 13.144092, Empirical Value: 11.714021
----------
Epoch 276/299
----------
train Loss: 0.423389, Best Value: 13.047946, Empirical Value: 11.596194
val Loss: 1.008222, Best Value: 13.199274, Empirical Value: 11.765069
----------
Epoch 277/299
----------
train Loss: 0.420430, Best Value: 13.041193, Empirical Value: 11.584820
val Loss: 1.025506, Best Value: 13.123984, Empirical Value: 11.760381
----------
Epoch 278/299
----------
train Loss: 0.416626, Best Value: 13.037542, Empirical Value: 11.589213
val Loss: 1.016941, Best Value: 13.188055, Empirical Value: 11.746635
----------
Epoch 279/299
----------
train Loss: 0.412716, Best Value: 13.043329, Empirical Value: 11.584781
val Loss: 1.019426, Best Value: 13.244795, Empirical Value: 11.854545
----------
Epoch 280/299
----------
Updating Target Model
train Loss: 0.410351, Best Value: 13.045506, Empirical Value: 11.580599
val Loss: 0.9144