In [1]:
from data import *
from utils.augmentations import SSDAugmentation
from layers.modules import MultiBoxLoss
from ssd import build_ssd
import os
import sys
import time
import torch
from torch.autograd import Variable
import torch.nn as nn

import torch.optim as optim
import torch.backends.cudnn as cudnn
import torch.nn.init as init
import torch.utils.data as data
import numpy as np
import argparse
import matplotlib.pyplot as plt
import torchvision

# NOTE(review): CUDA_LAUNCH_BLOCKING=1 is normally a debugging aid (documented to make
# CUDA kernel launches synchronous) — presumably left over from debugging; confirm it is
# still wanted before long training runs.
os.environ['CUDA_LAUNCH_BLOCKING'] = "1"

## Argument declarations

In [2]:
# --- Dataset ---------------------------------------------------------------
# NOTE(review): absolute, machine-specific path; adjust it for your environment.
DATASET_ROOT = "/home/austin/DataSet/ncsist_dataset/ncsist"
DATASET_NAME = "ncsist"
cfg = subt                      # config dict; 'min_dim', 'max_iter' and 'lr_steps' are read below
DATA_DETECTION = SUBTDetection  # dataset class instantiated in the "Create dataset" cell

# --- Weights / checkpoints -------------------------------------------------
BASE_NET = "./weights/vgg16_reducedfc.pth"  # loaded into ssd_net.vgg when not resuming
PRETRAINED_MODEL = None   # file name inside SAVE_FOLDER to resume from, or None
PRETRAINED_ITER = 0       # offset added to the iteration in logs and checkpoint names
SAVE_MODEL_ITER = 500     # checkpoint interval, in iterations
START_ITER = 0            # first iteration of the training loop

# --- Data loading / device -------------------------------------------------
BATCH_SIZE = 2
NUM_WORKERS = 4
CUDA = True

# --- Optimiser -------------------------------------------------------------
LR = 1e-3
MOMENTUM = 0.4
WEIGHT_DECAY = 5e-4
GAMMA = 0.1               # factor passed to adjust_learning_rate at each lr step

VISDOM = False

# Checkpoints are written under ./weights/<DATASET_NAME>/.
SAVE_FOLDER = "./weights/" + DATASET_NAME + "/"
# exist_ok=True makes the cell idempotent and avoids the check-then-create race.
os.makedirs(SAVE_FOLDER, exist_ok=True)
print('done')
print(DATA_DETECTION)

done
<class 'data.subt_artifact.SUBTDetection'>


In [3]:
# Reconcile the requested device (the CUDA flag) with what this machine offers,
# then choose the default tensor type accordingly.
cuda_available = torch.cuda.is_available()
if CUDA and not cuda_available:
    # Without this fallback the flag stays True and later cells fail on their
    # first .cuda() call.
    print("CUDA requested but no CUDA device is available; falling back to CPU.")
    CUDA = False

if cuda_available and not CUDA:
    # A GPU exists but was not requested: keep the current default tensor type.
    print("WTF are u wasting your CUDA device?")
elif CUDA:
    torch.set_default_tensor_type('torch.cuda.FloatTensor')
else:
    torch.set_default_tensor_type('torch.FloatTensor')

## Define helper functions

In [4]:
def str2bool(v):
    """Return True when ``v``, lower-cased, is one of "yes", "true", "t" or "1"."""
    truthy = ("yes", "true", "t", "1")
    lowered = v.lower()
    return lowered in truthy

# Initialise model weights & biases
def xavier(param):
    """Fill ``param`` in place with Xavier/Glorot uniform values."""
    # xavier_uniform_ is the in-place replacement for the deprecated xavier_uniform.
    init.xavier_uniform_(param)


def weights_init(m):
    """Initialise a Conv2d module: Xavier-uniform weights and zero bias.

    Intended for ``module.apply(weights_init)``; modules that are not
    ``nn.Conv2d`` are left untouched.
    """
    if isinstance(m, nn.Conv2d):
        xavier(m.weight.data)
        # Conv2d(bias=False) has m.bias set to None, so guard before zeroing.
        if m.bias is not None:
            m.bias.data.zero_()

# Adjust learning rate during training
def adjust_learning_rate(optimizer, gamma, step, base_lr=None):
    """Set every parameter group's learning rate to ``base_lr * gamma ** step``.

    Adapted from the PyTorch ImageNet example:
    https://github.com/pytorch/examples/blob/master/imagenet/main.py

    Args:
        optimizer: object exposing ``param_groups``, a list of dicts with an
            ``'lr'`` entry.
        gamma: multiplicative decay factor applied once per step.
        step: number of decay steps taken so far (the exponent of ``gamma``).
        base_lr: initial learning rate; when omitted, the notebook-level
            ``LR`` constant is used.

    Returns:
        The learning rate written into the parameter groups.
    """
    if base_lr is None:
        base_lr = LR
    lr = base_lr * (gamma ** step)
    for param_group in optimizer.param_groups:
        param_group['lr'] = lr
    # Report once per adjustment rather than once per parameter group.
    print("Change learning rate to: ", lr)
    return lr

## Create dataset

In [5]:
# Build the training split, applying SSDAugmentation at the configured input size.
dataset = DATA_DETECTION(
    root=DATASET_ROOT,
    image_sets=['train'],
    transform=SSDAugmentation(cfg['min_dim'], MEANS),
)

# class_to_ind maps class name -> index; show it, then order the pairs by index.
classes = dataset.target_transform.class_to_ind
print("Class to index: \n", classes)
classes = sorted(classes.items(), key=lambda kv: kv[1])

# Class names in index order, followed by a trailing 'None' entry.
label = [name for name, _ in classes] + ['None']
print(label)
true_label = ['missle', 'backpack', 'blueline', 'drill', 'can']
print(dataset.target_transform)

Class to index: 
 {'missle': 0, 'backpack': 1, 'blueline': 2, 'drill': 3, 'can': 4}
['missle', 'backpack', 'blueline', 'drill', 'can', 'None']
<data.subt_artifact.SUBTAnnotationTransform object at 0x7fe9dc315e10>


## Create model

In [6]:
# Declare the SSD network.
# The class count is fixed here instead of being read from cfg['num_classes'];
# a single constant keeps the network and the loss in agreement.
# NOTE(review): presumably the 5 dataset classes plus one extra slot — confirm against cfg.
NUM_CLASSES = 6
ssd_net = build_ssd('train', cfg['min_dim'], NUM_CLASSES)
net = ssd_net
if CUDA:
    # net wraps ssd_net; weights are still loaded and saved through ssd_net itself.
    net = torch.nn.DataParallel(ssd_net)
    cudnn.benchmark = True

if PRETRAINED_MODEL is not None:
    # Resume from a checkpoint stored in SAVE_FOLDER.
    print('Resuming training, loading {}...'.format(PRETRAINED_MODEL))
    ssd_net.load_weights(SAVE_FOLDER + PRETRAINED_MODEL)
else:
    # Fresh run: load the base-network weights into the VGG part, then
    # initialise the extra, localisation and confidence layers.
    print('Initializing weights...')
    vgg_weights = torch.load(BASE_NET)
    ssd_net.vgg.load_state_dict(vgg_weights)
    ssd_net.extras.apply(weights_init)
    ssd_net.loc.apply(weights_init)
    ssd_net.conf.apply(weights_init)

optimizer = optim.SGD(net.parameters(), lr=LR, momentum=MOMENTUM,
                      weight_decay=WEIGHT_DECAY)
print(cfg['min_dim'])
criterion = MultiBoxLoss(BATCH_SIZE, NUM_CLASSES, 0.5, True, 0, True, 3, 0.5, False, CUDA)

Initializing weights...
300


  self.priors = Variable(self.priorbox.forward(), volatile=True)
  init.constant(self.weight,self.gamma)
  


## Training

### Initialize

In [7]:
# Put the network in training mode before any batches are drawn.
net.train()

# Running loss totals and epoch bookkeeping.
loc_loss, conf_loss = 0, 0
epoch = 0
print('Loading the dataset...')
epoch_size = len(dataset) // BATCH_SIZE
print('Training SSD on:', DATASET_NAME)

# Shuffled loader over the training set, batched with detection_collate.
data_loader = data.DataLoader(
    dataset,
    batch_size=BATCH_SIZE,
    shuffle=True,
    num_workers=NUM_WORKERS,
    collate_fn=detection_collate,
    pin_memory=True,
)
batch_iterator = iter(data_loader)

Loading the dataset...
Training SSD on: ncsist


  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


### Start training

In [8]:
step_index = 0
for iteration in range(START_ITER, cfg['max_iter']):
    # Decay the learning rate whenever a configured milestone is reached.
    if iteration in cfg['lr_steps']:
        step_index += 1
        adjust_learning_rate(optimizer, GAMMA, step_index)

    # Fetch the next batch; restart the loader once it is exhausted.
    try:
        images, targets = next(batch_iterator)
    except StopIteration:
        batch_iterator = iter(data_loader)
        images, targets = next(batch_iterator)

    # The Variable(..., volatile=True) wrappers were dropped: this loop already
    # relies on .item() (PyTorch >= 0.4), where `volatile` has no effect and
    # only emits a warning.
    if CUDA:
        images = images.cuda()
        targets = [ann.cuda() for ann in targets]

    # Time the forward pass, loss, backward pass and optimiser step together.
    t0 = time.time()
    out = net(images)
    optimizer.zero_grad()
    loss_l, loss_c = criterion(out, targets)
    loss = loss_l + loss_c
    loss.backward()
    optimizer.step()
    t1 = time.time()
    loc_loss += loss_l.item()
    conf_loss += loss_c.item()

    # Progress report every 10 iterations.
    if iteration % 10 == 0:
        print('timer: %.4f sec.' % (t1 - t0))
        print('iter ' + repr(PRETRAINED_ITER + iteration) + ' || Loss: %.4f ||' % (loss.item()), end='')

    # Periodic checkpoint; the file name includes the PRETRAINED_ITER offset.
    if iteration != 0 and iteration % SAVE_MODEL_ITER == 0:
        print('Saving state, iter:', iteration)
        torch.save(ssd_net.state_dict(), SAVE_FOLDER + DATASET_NAME + "_" +
                   repr(PRETRAINED_ITER + iteration) + '.pth')

# Save final model
torch.save(ssd_net.state_dict(),
           SAVE_FOLDER + DATASET_NAME + '.pth')

  app.launch_new_instance()


timer: 1.6843 sec.
iter 0 || Loss: 25.3610 ||timer: 0.0737 sec.
iter 10 || Loss: 13.7424 ||timer: 0.0743 sec.
iter 20 || Loss: 12.0291 ||timer: 0.0740 sec.
iter 30 || Loss: 22.8058 ||timer: 0.0740 sec.
iter 40 || Loss: 13.6582 ||timer: 0.0744 sec.
iter 50 || Loss: 12.2426 ||timer: 0.0743 sec.
iter 60 || Loss: 11.1824 ||timer: 0.0742 sec.
iter 70 || Loss: 9.7754 ||timer: 0.0743 sec.
iter 80 || Loss: 13.8774 ||timer: 0.0737 sec.
iter 90 || Loss: 11.1061 ||timer: 0.0738 sec.
iter 100 || Loss: 14.2042 ||timer: 0.0749 sec.
iter 110 || Loss: 9.0314 ||timer: 0.0750 sec.
iter 120 || Loss: 8.1012 ||timer: 0.0753 sec.
iter 130 || Loss: 8.8196 ||timer: 0.0736 sec.
iter 140 || Loss: 9.3161 ||timer: 0.0743 sec.
iter 150 || Loss: 9.0463 ||timer: 0.0748 sec.
iter 160 || Loss: 8.5661 ||timer: 0.0751 sec.
iter 170 || Loss: 3.8306 ||timer: 0.0749 sec.
iter 180 || Loss: 7.0922 ||timer: 0.0746 sec.
iter 190 || Loss: 7.3088 ||timer: 0.0752 sec.
iter 200 || Loss: 6.1022 ||timer: 0.0749 sec.
iter 210 || Loss

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0892 sec.
iter 360 || Loss: 7.2813 ||timer: 0.0739 sec.
iter 370 || Loss: 10.0878 ||timer: 0.0739 sec.
iter 380 || Loss: 5.1641 ||timer: 0.0745 sec.
iter 390 || Loss: 5.5293 ||timer: 0.0741 sec.
iter 400 || Loss: 6.5488 ||timer: 0.0758 sec.
iter 410 || Loss: 5.7965 ||timer: 0.0744 sec.
iter 420 || Loss: 7.1061 ||timer: 0.0747 sec.
iter 430 || Loss: 6.0996 ||timer: 0.0747 sec.
iter 440 || Loss: 7.1082 ||timer: 0.0745 sec.
iter 450 || Loss: 4.6745 ||timer: 0.0748 sec.
iter 460 || Loss: 4.9923 ||timer: 0.0750 sec.
iter 470 || Loss: 6.3701 ||timer: 0.0741 sec.
iter 480 || Loss: 3.3314 ||timer: 0.0750 sec.
iter 490 || Loss: 6.4609 ||timer: 0.0740 sec.
iter 500 || Loss: 7.6424 ||Saving state, iter: 500
timer: 0.0747 sec.
iter 510 || Loss: 5.8698 ||timer: 0.0743 sec.
iter 520 || Loss: 4.9954 ||timer: 0.0751 sec.
iter 530 || Loss: 5.1336 ||timer: 0.0753 sec.
iter 540 || Loss: 4.3848 ||timer: 0.0748 sec.
iter 550 || Loss: 3.2365 ||timer: 0.0762 sec.
iter 560 || Loss: 4.6106 ||timer: 0.

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0851 sec.
iter 720 || Loss: 5.0938 ||timer: 0.0754 sec.
iter 730 || Loss: 5.2161 ||timer: 0.0747 sec.
iter 740 || Loss: 4.1328 ||timer: 0.0748 sec.
iter 750 || Loss: 4.6689 ||timer: 0.0757 sec.
iter 760 || Loss: 7.3201 ||timer: 0.0748 sec.
iter 770 || Loss: 4.5530 ||timer: 0.0753 sec.
iter 780 || Loss: 4.5160 ||timer: 0.0748 sec.
iter 790 || Loss: 8.8821 ||timer: 0.0746 sec.
iter 800 || Loss: 4.4073 ||timer: 0.0749 sec.
iter 810 || Loss: 5.3197 ||timer: 0.0745 sec.
iter 820 || Loss: 5.9461 ||timer: 0.0749 sec.
iter 830 || Loss: 4.3186 ||timer: 0.0747 sec.
iter 840 || Loss: 7.9586 ||timer: 0.0752 sec.
iter 850 || Loss: 3.7158 ||timer: 0.0748 sec.
iter 860 || Loss: 3.5699 ||timer: 0.0747 sec.
iter 870 || Loss: 8.8428 ||timer: 0.0752 sec.
iter 880 || Loss: 9.3802 ||timer: 0.0752 sec.
iter 890 || Loss: 6.2488 ||timer: 0.0745 sec.
iter 900 || Loss: 3.0281 ||timer: 0.0747 sec.
iter 910 || Loss: 2.9565 ||timer: 0.0748 sec.
iter 920 || Loss: 5.8024 ||timer: 0.0747 sec.
iter 930 || Los

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0801 sec.
iter 1080 || Loss: 3.4189 ||timer: 0.0751 sec.
iter 1090 || Loss: 4.0245 ||timer: 0.0747 sec.
iter 1100 || Loss: 4.3095 ||timer: 0.0744 sec.
iter 1110 || Loss: 4.6765 ||timer: 0.0753 sec.
iter 1120 || Loss: 4.2255 ||timer: 0.0752 sec.
iter 1130 || Loss: 9.7089 ||timer: 0.0751 sec.
iter 1140 || Loss: 5.6860 ||timer: 0.0745 sec.
iter 1150 || Loss: 3.7455 ||timer: 0.0744 sec.
iter 1160 || Loss: 4.8873 ||timer: 0.0747 sec.
iter 1170 || Loss: 3.5170 ||timer: 0.0752 sec.
iter 1180 || Loss: 2.9104 ||timer: 0.0749 sec.
iter 1190 || Loss: 4.7428 ||timer: 0.0759 sec.
iter 1200 || Loss: 4.7731 ||timer: 0.0749 sec.
iter 1210 || Loss: 7.0013 ||timer: 0.0758 sec.
iter 1220 || Loss: 4.5855 ||timer: 0.0751 sec.
iter 1230 || Loss: 2.7528 ||timer: 0.0749 sec.
iter 1240 || Loss: 3.3140 ||timer: 0.0749 sec.
iter 1250 || Loss: 2.7541 ||timer: 0.0760 sec.
iter 1260 || Loss: 5.3534 ||timer: 0.0754 sec.
iter 1270 || Loss: 2.8339 ||timer: 0.0754 sec.
iter 1280 || Loss: 5.0146 ||timer: 0.0756

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0787 sec.
iter 1440 || Loss: 3.8197 ||timer: 0.0760 sec.
iter 1450 || Loss: 2.5193 ||timer: 0.0756 sec.
iter 1460 || Loss: 3.1281 ||timer: 0.0754 sec.
iter 1470 || Loss: 3.2092 ||timer: 0.0755 sec.
iter 1480 || Loss: 3.8901 ||timer: 0.0759 sec.
iter 1490 || Loss: 4.0330 ||timer: 0.0757 sec.
iter 1500 || Loss: 3.6916 ||Saving state, iter: 1500
timer: 0.0760 sec.
iter 1510 || Loss: 1.5984 ||timer: 0.0752 sec.
iter 1520 || Loss: 6.9206 ||timer: 0.0760 sec.
iter 1530 || Loss: 2.0694 ||timer: 0.0752 sec.
iter 1540 || Loss: 2.4601 ||timer: 0.0749 sec.
iter 1550 || Loss: 4.1002 ||timer: 0.0748 sec.
iter 1560 || Loss: 2.4695 ||timer: 0.0750 sec.
iter 1570 || Loss: 3.8759 ||timer: 0.0745 sec.
iter 1580 || Loss: 2.0982 ||timer: 0.0747 sec.
iter 1590 || Loss: 3.6589 ||timer: 0.0758 sec.
iter 1600 || Loss: 2.0247 ||timer: 0.0749 sec.
iter 1610 || Loss: 2.9712 ||timer: 0.0767 sec.
iter 1620 || Loss: 4.2545 ||timer: 0.0747 sec.
iter 1630 || Loss: 3.0238 ||timer: 0.0754 sec.
iter 1640 || Los

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0810 sec.
iter 1800 || Loss: 2.4871 ||timer: 0.0748 sec.
iter 1810 || Loss: 3.2191 ||timer: 0.0755 sec.
iter 1820 || Loss: 3.9301 ||timer: 0.0762 sec.
iter 1830 || Loss: 2.6415 ||timer: 0.0751 sec.
iter 1840 || Loss: 2.0223 ||timer: 0.0752 sec.
iter 1850 || Loss: 4.9139 ||timer: 0.0762 sec.
iter 1860 || Loss: 3.2507 ||timer: 0.0759 sec.
iter 1870 || Loss: 3.1175 ||timer: 0.0754 sec.
iter 1880 || Loss: 3.9381 ||timer: 0.0749 sec.
iter 1890 || Loss: 2.2003 ||timer: 0.0759 sec.
iter 1900 || Loss: 2.4382 ||timer: 0.0750 sec.
iter 1910 || Loss: 3.3236 ||timer: 0.0751 sec.
iter 1920 || Loss: 2.4599 ||timer: 0.0753 sec.
iter 1930 || Loss: 2.0751 ||timer: 0.0761 sec.
iter 1940 || Loss: 2.9457 ||timer: 0.0772 sec.
iter 1950 || Loss: 10.2627 ||timer: 0.0759 sec.
iter 1960 || Loss: 1.7494 ||timer: 0.0760 sec.
iter 1970 || Loss: 5.1023 ||timer: 0.0755 sec.
iter 1980 || Loss: 4.5889 ||timer: 0.0751 sec.
iter 1990 || Loss: 3.1394 ||timer: 0.0758 sec.
iter 2000 || Loss: 1.8959 ||Saving state

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0938 sec.
iter 2160 || Loss: 3.8160 ||timer: 0.0749 sec.
iter 2170 || Loss: 3.4228 ||timer: 0.0758 sec.
iter 2180 || Loss: 4.4796 ||timer: 0.0773 sec.
iter 2190 || Loss: 2.1800 ||timer: 0.0792 sec.
iter 2200 || Loss: 2.4165 ||timer: 0.0769 sec.
iter 2210 || Loss: 2.7496 ||timer: 0.0756 sec.
iter 2220 || Loss: 2.7370 ||timer: 0.0754 sec.
iter 2230 || Loss: 1.0871 ||timer: 0.0752 sec.
iter 2240 || Loss: 2.7709 ||timer: 0.0761 sec.
iter 2250 || Loss: 5.8962 ||timer: 0.0750 sec.
iter 2260 || Loss: 2.2409 ||timer: 0.0760 sec.
iter 2270 || Loss: 2.7644 ||timer: 0.0750 sec.
iter 2280 || Loss: 2.8184 ||timer: 0.0756 sec.
iter 2290 || Loss: 1.8533 ||timer: 0.0779 sec.
iter 2300 || Loss: 4.8125 ||timer: 0.0756 sec.
iter 2310 || Loss: 1.5416 ||timer: 0.0759 sec.
iter 2320 || Loss: 3.9452 ||timer: 0.0759 sec.
iter 2330 || Loss: 4.1167 ||timer: 0.0784 sec.
iter 2340 || Loss: 2.4920 ||timer: 0.0757 sec.
iter 2350 || Loss: 2.2480 ||timer: 0.0766 sec.
iter 2360 || Loss: 1.3696 ||timer: 0.0748

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0925 sec.
iter 2520 || Loss: 3.5630 ||timer: 0.0761 sec.
iter 2530 || Loss: 1.9435 ||timer: 0.0754 sec.
iter 2540 || Loss: 3.6982 ||timer: 0.0769 sec.
iter 2550 || Loss: 2.8601 ||timer: 0.0763 sec.
iter 2560 || Loss: 3.3327 ||timer: 0.0750 sec.
iter 2570 || Loss: 2.3414 ||timer: 0.0798 sec.
iter 2580 || Loss: 5.5392 ||timer: 0.0773 sec.
iter 2590 || Loss: 2.0532 ||timer: 0.0771 sec.
iter 2600 || Loss: 2.8665 ||timer: 0.0761 sec.
iter 2610 || Loss: 4.6366 ||timer: 0.0752 sec.
iter 2620 || Loss: 2.7069 ||timer: 0.0770 sec.
iter 2630 || Loss: 2.4827 ||timer: 0.0755 sec.
iter 2640 || Loss: 3.4630 ||timer: 0.0757 sec.
iter 2650 || Loss: 1.4797 ||timer: 0.0749 sec.
iter 2660 || Loss: 3.6480 ||timer: 0.0757 sec.
iter 2670 || Loss: 4.2010 ||timer: 0.0761 sec.
iter 2680 || Loss: 5.6792 ||timer: 0.0755 sec.
iter 2690 || Loss: 1.1808 ||timer: 0.0762 sec.
iter 2700 || Loss: 2.8938 ||timer: 0.0751 sec.
iter 2710 || Loss: 2.0801 ||timer: 0.0777 sec.
iter 2720 || Loss: 2.7807 ||timer: 0.0766

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0802 sec.
iter 2880 || Loss: 2.4958 ||timer: 0.0753 sec.
iter 2890 || Loss: 5.3640 ||timer: 0.0765 sec.
iter 2900 || Loss: 3.6972 ||timer: 0.0759 sec.
iter 2910 || Loss: 6.4226 ||timer: 0.0748 sec.
iter 2920 || Loss: 3.6119 ||timer: 0.0754 sec.
iter 2930 || Loss: 4.6736 ||timer: 0.0752 sec.
iter 2940 || Loss: 7.2190 ||timer: 0.0767 sec.
iter 2950 || Loss: 3.1916 ||timer: 0.0757 sec.
iter 2960 || Loss: 2.4844 ||timer: 0.0780 sec.
iter 2970 || Loss: 3.8786 ||timer: 0.0753 sec.
iter 2980 || Loss: 1.6886 ||timer: 0.0763 sec.
iter 2990 || Loss: 1.5429 ||timer: 0.0775 sec.
iter 3000 || Loss: 3.3739 ||Saving state, iter: 3000
timer: 0.0762 sec.
iter 3010 || Loss: 2.2314 ||timer: 0.0771 sec.
iter 3020 || Loss: 3.4850 ||timer: 0.0789 sec.
iter 3030 || Loss: 4.7701 ||timer: 0.0758 sec.
iter 3040 || Loss: 1.4638 ||timer: 0.0759 sec.
iter 3050 || Loss: 1.9172 ||timer: 0.0786 sec.
iter 3060 || Loss: 2.4716 ||timer: 0.0783 sec.
iter 3070 || Loss: 4.2800 ||timer: 0.0763 sec.
iter 3080 || Los

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0859 sec.
iter 3240 || Loss: 2.1431 ||timer: 0.0775 sec.
iter 3250 || Loss: 2.4700 ||timer: 0.0754 sec.
iter 3260 || Loss: 2.7355 ||timer: 0.0799 sec.
iter 3270 || Loss: 1.8722 ||timer: 0.0792 sec.
iter 3280 || Loss: 2.1839 ||timer: 0.0763 sec.
iter 3290 || Loss: 2.6746 ||timer: 0.0760 sec.
iter 3300 || Loss: 2.1627 ||timer: 0.0752 sec.
iter 3310 || Loss: 2.4862 ||timer: 0.0751 sec.
iter 3320 || Loss: 3.4809 ||timer: 0.0755 sec.
iter 3330 || Loss: 5.2373 ||timer: 0.0769 sec.
iter 3340 || Loss: 2.7018 ||timer: 0.0756 sec.
iter 3350 || Loss: 1.6560 ||timer: 0.0765 sec.
iter 3360 || Loss: 2.6409 ||timer: 0.0768 sec.
iter 3370 || Loss: 3.0141 ||timer: 0.0754 sec.
iter 3380 || Loss: 2.0685 ||timer: 0.0769 sec.
iter 3390 || Loss: 5.1558 ||timer: 0.0799 sec.
iter 3400 || Loss: 1.6356 ||timer: 0.0759 sec.
iter 3410 || Loss: 2.3868 ||timer: 0.0778 sec.
iter 3420 || Loss: 2.9744 ||timer: 0.0775 sec.
iter 3430 || Loss: 2.9600 ||timer: 0.0774 sec.
iter 3440 || Loss: 1.9088 ||timer: 0.0773

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0810 sec.
iter 3600 || Loss: 1.7837 ||timer: 0.0766 sec.
iter 3610 || Loss: 1.7122 ||timer: 0.0797 sec.
iter 3620 || Loss: 2.1695 ||timer: 0.0772 sec.
iter 3630 || Loss: 3.3049 ||timer: 0.0756 sec.
iter 3640 || Loss: 1.5713 ||timer: 0.0756 sec.
iter 3650 || Loss: 2.5930 ||timer: 0.0787 sec.
iter 3660 || Loss: 2.7659 ||timer: 0.0787 sec.
iter 3670 || Loss: 3.3517 ||timer: 0.0777 sec.
iter 3680 || Loss: 2.2967 ||timer: 0.0768 sec.
iter 3690 || Loss: 1.4100 ||timer: 0.0815 sec.
iter 3700 || Loss: 1.5005 ||timer: 0.0755 sec.
iter 3710 || Loss: 1.6560 ||timer: 0.0800 sec.
iter 3720 || Loss: 1.5510 ||timer: 0.0758 sec.
iter 3730 || Loss: 2.2730 ||timer: 0.0757 sec.
iter 3740 || Loss: 1.7187 ||timer: 0.0766 sec.
iter 3750 || Loss: 3.0908 ||timer: 0.0755 sec.
iter 3760 || Loss: 3.0071 ||timer: 0.0759 sec.
iter 3770 || Loss: 2.4827 ||timer: 0.0758 sec.
iter 3780 || Loss: 3.4536 ||timer: 0.0795 sec.
iter 3790 || Loss: 5.1115 ||timer: 0.0757 sec.
iter 3800 || Loss: 4.9602 ||timer: 0.0773

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0856 sec.
iter 3960 || Loss: 2.6844 ||timer: 0.0755 sec.
iter 3970 || Loss: 2.6291 ||timer: 0.0761 sec.
iter 3980 || Loss: 1.5492 ||timer: 0.0754 sec.
iter 3990 || Loss: 0.9299 ||Change learning rate to:  0.0001
timer: 0.0753 sec.
iter 4000 || Loss: 2.3415 ||Saving state, iter: 4000
timer: 0.0756 sec.
iter 4010 || Loss: 4.1512 ||timer: 0.0757 sec.
iter 4020 || Loss: 2.3039 ||timer: 0.0772 sec.
iter 4030 || Loss: 2.1852 ||timer: 0.0791 sec.
iter 4040 || Loss: 1.3787 ||timer: 0.0779 sec.
iter 4050 || Loss: 2.6652 ||timer: 0.0773 sec.
iter 4060 || Loss: 2.4649 ||timer: 0.0801 sec.
iter 4070 || Loss: 0.9850 ||timer: 0.0751 sec.
iter 4080 || Loss: 3.8375 ||timer: 0.0762 sec.
iter 4090 || Loss: 0.9999 ||timer: 0.0770 sec.
iter 4100 || Loss: 1.9391 ||timer: 0.0757 sec.
iter 4110 || Loss: 2.3361 ||timer: 0.0763 sec.
iter 4120 || Loss: 1.8130 ||timer: 0.0782 sec.
iter 4130 || Loss: 1.8557 ||timer: 0.0771 sec.
iter 4140 || Loss: 2.3885 ||timer: 0.0768 sec.
iter 4150 || Loss: 3.7755 ||ti

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0793 sec.
iter 4320 || Loss: 1.6713 ||timer: 0.0814 sec.
iter 4330 || Loss: 1.9246 ||timer: 0.0772 sec.
iter 4340 || Loss: 1.1712 ||timer: 0.0790 sec.
iter 4350 || Loss: 2.3535 ||timer: 0.0771 sec.
iter 4360 || Loss: 0.8578 ||timer: 0.0758 sec.
iter 4370 || Loss: 1.3189 ||timer: 0.0794 sec.
iter 4380 || Loss: 2.4917 ||timer: 0.0769 sec.
iter 4390 || Loss: 1.2553 ||timer: 0.0805 sec.
iter 4400 || Loss: 1.0852 ||timer: 0.0769 sec.
iter 4410 || Loss: 1.7552 ||timer: 0.0791 sec.
iter 4420 || Loss: 1.4779 ||timer: 0.0802 sec.
iter 4430 || Loss: 1.1629 ||timer: 0.0781 sec.
iter 4440 || Loss: 1.5345 ||timer: 0.0793 sec.
iter 4450 || Loss: 1.2731 ||timer: 0.0768 sec.
iter 4460 || Loss: 1.1697 ||timer: 0.0781 sec.
iter 4470 || Loss: 1.7941 ||timer: 0.0793 sec.
iter 4480 || Loss: 3.0042 ||timer: 0.0788 sec.
iter 4490 || Loss: 2.9984 ||timer: 0.0788 sec.
iter 4500 || Loss: 3.8053 ||Saving state, iter: 4500
timer: 0.0777 sec.
iter 4510 || Loss: 1.4171 ||timer: 0.0753 sec.
iter 4520 || Los

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0853 sec.
iter 4680 || Loss: 1.4668 ||timer: 0.0770 sec.
iter 4690 || Loss: 2.7534 ||timer: 0.0798 sec.
iter 4700 || Loss: 0.7397 ||timer: 0.0763 sec.
iter 4710 || Loss: 1.2819 ||timer: 0.0789 sec.
iter 4720 || Loss: 1.6394 ||timer: 0.0778 sec.
iter 4730 || Loss: 1.7342 ||timer: 0.0758 sec.
iter 4740 || Loss: 2.3355 ||timer: 0.0756 sec.
iter 4750 || Loss: 2.8119 ||timer: 0.0773 sec.
iter 4760 || Loss: 1.4000 ||timer: 0.0762 sec.
iter 4770 || Loss: 6.1594 ||timer: 0.0770 sec.
iter 4780 || Loss: 1.5633 ||timer: 0.0790 sec.
iter 4790 || Loss: 1.2710 ||timer: 0.0755 sec.
iter 4800 || Loss: 1.6534 ||timer: 0.0793 sec.
iter 4810 || Loss: 1.4214 ||timer: 0.0762 sec.
iter 4820 || Loss: 1.9084 ||timer: 0.0773 sec.
iter 4830 || Loss: 1.1488 ||timer: 0.0752 sec.
iter 4840 || Loss: 2.1726 ||timer: 0.0762 sec.
iter 4850 || Loss: 1.6203 ||timer: 0.0764 sec.
iter 4860 || Loss: 1.8767 ||timer: 0.0750 sec.
iter 4870 || Loss: 1.0625 ||timer: 0.0778 sec.
iter 4880 || Loss: 0.6016 ||timer: 0.0755

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0936 sec.
iter 5040 || Loss: 1.5728 ||timer: 0.0761 sec.
iter 5050 || Loss: 1.0231 ||timer: 0.0764 sec.
iter 5060 || Loss: 0.8201 ||timer: 0.0784 sec.
iter 5070 || Loss: 1.1452 ||timer: 0.0764 sec.
iter 5080 || Loss: 1.0430 ||timer: 0.0799 sec.
iter 5090 || Loss: 1.8246 ||timer: 0.0769 sec.
iter 5100 || Loss: 1.3630 ||timer: 0.0756 sec.
iter 5110 || Loss: 0.9248 ||timer: 0.0755 sec.
iter 5120 || Loss: 2.5001 ||timer: 0.0759 sec.
iter 5130 || Loss: 0.7390 ||timer: 0.0768 sec.
iter 5140 || Loss: 2.1621 ||timer: 0.0771 sec.
iter 5150 || Loss: 1.2293 ||timer: 0.0752 sec.
iter 5160 || Loss: 4.2146 ||timer: 0.0769 sec.
iter 5170 || Loss: 0.9658 ||timer: 0.0850 sec.
iter 5180 || Loss: 0.9724 ||timer: 0.0805 sec.
iter 5190 || Loss: 0.8213 ||timer: 0.0761 sec.
iter 5200 || Loss: 5.2176 ||timer: 0.0772 sec.
iter 5210 || Loss: 1.7178 ||timer: 0.0761 sec.
iter 5220 || Loss: 1.2633 ||timer: 0.0771 sec.
iter 5230 || Loss: 1.6263 ||timer: 0.0758 sec.
iter 5240 || Loss: 1.4655 ||timer: 0.0758

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0857 sec.
iter 5400 || Loss: 1.6198 ||timer: 0.0762 sec.
iter 5410 || Loss: 2.0422 ||timer: 0.0760 sec.
iter 5420 || Loss: 2.0100 ||timer: 0.0756 sec.
iter 5430 || Loss: 0.9444 ||timer: 0.0784 sec.
iter 5440 || Loss: 1.1249 ||timer: 0.0764 sec.
iter 5450 || Loss: 1.7226 ||timer: 0.0773 sec.
iter 5460 || Loss: 1.4602 ||timer: 0.0794 sec.
iter 5470 || Loss: 2.7892 ||timer: 0.0773 sec.
iter 5480 || Loss: 1.4026 ||timer: 0.0793 sec.
iter 5490 || Loss: 1.2278 ||timer: 0.0756 sec.
iter 5500 || Loss: 2.2812 ||Saving state, iter: 5500
timer: 0.0778 sec.
iter 5510 || Loss: 1.9209 ||timer: 0.0785 sec.
iter 5520 || Loss: 0.8683 ||timer: 0.0801 sec.
iter 5530 || Loss: 1.2770 ||timer: 0.0779 sec.
iter 5540 || Loss: 1.9157 ||timer: 0.0751 sec.
iter 5550 || Loss: 1.1589 ||timer: 0.0768 sec.
iter 5560 || Loss: 1.8867 ||timer: 0.0755 sec.
iter 5570 || Loss: 0.6332 ||timer: 0.0772 sec.
iter 5580 || Loss: 1.7811 ||timer: 0.0789 sec.
iter 5590 || Loss: 1.5193 ||timer: 0.0751 sec.
iter 5600 || Los

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0870 sec.
iter 5760 || Loss: 1.4811 ||timer: 0.0754 sec.
iter 5770 || Loss: 1.2023 ||timer: 0.0778 sec.
iter 5780 || Loss: 1.0449 ||timer: 0.0763 sec.
iter 5790 || Loss: 1.5218 ||timer: 0.0778 sec.
iter 5800 || Loss: 2.4061 ||timer: 0.0766 sec.
iter 5810 || Loss: 1.0441 ||timer: 0.0757 sec.
iter 5820 || Loss: 1.2881 ||timer: 0.0754 sec.
iter 5830 || Loss: 1.0702 ||timer: 0.0768 sec.
iter 5840 || Loss: 1.7401 ||timer: 0.0760 sec.
iter 5850 || Loss: 0.8931 ||timer: 0.0772 sec.
iter 5860 || Loss: 1.1217 ||timer: 0.0760 sec.
iter 5870 || Loss: 1.3151 ||timer: 0.0786 sec.
iter 5880 || Loss: 0.8701 ||timer: 0.0752 sec.
iter 5890 || Loss: 1.1641 ||timer: 0.0775 sec.
iter 5900 || Loss: 2.2479 ||timer: 0.0767 sec.
iter 5910 || Loss: 1.8186 ||timer: 0.0767 sec.
iter 5920 || Loss: 0.9623 ||timer: 0.0805 sec.
iter 5930 || Loss: 1.0503 ||timer: 0.0778 sec.
iter 5940 || Loss: 0.7618 ||timer: 0.0892 sec.
iter 5950 || Loss: 0.9955 ||timer: 0.0791 sec.
iter 5960 || Loss: 1.8091 ||timer: 0.0809

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0804 sec.
iter 6120 || Loss: 1.2845 ||timer: 0.0766 sec.
iter 6130 || Loss: 1.9774 ||timer: 0.0773 sec.
iter 6140 || Loss: 0.7874 ||timer: 0.0827 sec.
iter 6150 || Loss: 0.8258 ||timer: 0.0810 sec.
iter 6160 || Loss: 1.5901 ||timer: 0.0775 sec.
iter 6170 || Loss: 1.1556 ||timer: 0.0791 sec.
iter 6180 || Loss: 2.6555 ||timer: 0.0779 sec.
iter 6190 || Loss: 2.3317 ||timer: 0.0814 sec.
iter 6200 || Loss: 1.3715 ||timer: 0.0826 sec.
iter 6210 || Loss: 2.3937 ||timer: 0.0773 sec.
iter 6220 || Loss: 2.4568 ||timer: 0.0805 sec.
iter 6230 || Loss: 1.3046 ||timer: 0.0840 sec.
iter 6240 || Loss: 1.1844 ||timer: 0.0766 sec.
iter 6250 || Loss: 1.2560 ||timer: 0.0783 sec.
iter 6260 || Loss: 0.4939 ||timer: 0.0791 sec.
iter 6270 || Loss: 2.0835 ||timer: 0.0842 sec.
iter 6280 || Loss: 1.0675 ||timer: 0.0800 sec.
iter 6290 || Loss: 1.2067 ||timer: 0.0838 sec.
iter 6300 || Loss: 3.3771 ||timer: 0.0826 sec.
iter 6310 || Loss: 2.1643 ||timer: 0.0834 sec.
iter 6320 || Loss: 0.8188 ||timer: 0.0813

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0949 sec.
iter 6480 || Loss: 3.0429 ||timer: 0.0778 sec.
iter 6490 || Loss: 1.2234 ||timer: 0.0973 sec.
iter 6500 || Loss: 7.0384 ||Saving state, iter: 6500
timer: 0.0847 sec.
iter 6510 || Loss: 1.8751 ||timer: 0.0820 sec.
iter 6520 || Loss: 1.8138 ||timer: 0.0763 sec.
iter 6530 || Loss: 1.7381 ||timer: 0.0868 sec.
iter 6540 || Loss: 1.0143 ||timer: 0.0806 sec.
iter 6550 || Loss: 4.0090 ||timer: 0.0838 sec.
iter 6560 || Loss: 1.0567 ||timer: 0.0835 sec.
iter 6570 || Loss: 3.5278 ||timer: 0.0758 sec.
iter 6580 || Loss: 2.1263 ||timer: 0.0811 sec.
iter 6590 || Loss: 1.2351 ||timer: 0.0876 sec.
iter 6600 || Loss: 1.6845 ||timer: 0.0790 sec.
iter 6610 || Loss: 1.0162 ||timer: 0.0779 sec.
iter 6620 || Loss: 1.0616 ||timer: 0.0767 sec.
iter 6630 || Loss: 3.3310 ||timer: 0.0759 sec.
iter 6640 || Loss: 1.7232 ||timer: 0.0776 sec.
iter 6650 || Loss: 4.2961 ||timer: 0.0797 sec.
iter 6660 || Loss: 1.0316 ||timer: 0.0752 sec.
iter 6670 || Loss: 2.2457 ||timer: 0.0819 sec.
iter 6680 || Los

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.1113 sec.
iter 6840 || Loss: 0.8540 ||timer: 0.0867 sec.
iter 6850 || Loss: 3.0993 ||timer: 0.0848 sec.
iter 6860 || Loss: 1.1839 ||timer: 0.0915 sec.
iter 6870 || Loss: 0.9109 ||timer: 0.0839 sec.
iter 6880 || Loss: 1.0181 ||timer: 0.0856 sec.
iter 6890 || Loss: 4.5572 ||timer: 0.0911 sec.
iter 6900 || Loss: 1.2840 ||timer: 0.0818 sec.
iter 6910 || Loss: 2.2832 ||timer: 0.0834 sec.
iter 6920 || Loss: 0.8561 ||timer: 0.0761 sec.
iter 6930 || Loss: 1.2305 ||timer: 0.0781 sec.
iter 6940 || Loss: 0.7913 ||timer: 0.0778 sec.
iter 6950 || Loss: 1.3144 ||timer: 0.0933 sec.
iter 6960 || Loss: 2.1025 ||timer: 0.0769 sec.
iter 6970 || Loss: 2.7230 ||timer: 0.0815 sec.
iter 6980 || Loss: 0.9631 ||timer: 0.0831 sec.
iter 6990 || Loss: 0.7299 ||timer: 0.0795 sec.
iter 7000 || Loss: 1.3868 ||Saving state, iter: 7000
timer: 0.0829 sec.
iter 7010 || Loss: 0.9223 ||timer: 0.0798 sec.
iter 7020 || Loss: 1.9410 ||timer: 0.0768 sec.
iter 7030 || Loss: 1.4965 ||timer: 0.0885 sec.
iter 7040 || Los

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0905 sec.
iter 7200 || Loss: 1.2463 ||timer: 0.0838 sec.
iter 7210 || Loss: 1.3029 ||timer: 0.0793 sec.
iter 7220 || Loss: 2.6862 ||timer: 0.0817 sec.
iter 7230 || Loss: 1.9237 ||timer: 0.0857 sec.
iter 7240 || Loss: 1.2609 ||timer: 0.0776 sec.
iter 7250 || Loss: 5.0588 ||timer: 0.0759 sec.
iter 7260 || Loss: 0.9186 ||timer: 0.0805 sec.
iter 7270 || Loss: 0.9939 ||timer: 0.0780 sec.
iter 7280 || Loss: 1.1147 ||timer: 0.0813 sec.
iter 7290 || Loss: 1.0803 ||timer: 0.0965 sec.
iter 7300 || Loss: 1.9976 ||timer: 0.0870 sec.
iter 7310 || Loss: 0.5523 ||timer: 0.0898 sec.
iter 7320 || Loss: 1.5234 ||timer: 0.0816 sec.
iter 7330 || Loss: 1.9077 ||timer: 0.0758 sec.
iter 7340 || Loss: 0.8137 ||timer: 0.0794 sec.
iter 7350 || Loss: 1.1021 ||timer: 0.0806 sec.
iter 7360 || Loss: 0.7434 ||timer: 0.0764 sec.
iter 7370 || Loss: 1.9593 ||timer: 0.0810 sec.
iter 7380 || Loss: 1.3381 ||timer: 0.0770 sec.
iter 7390 || Loss: 1.3003 ||timer: 0.0760 sec.
iter 7400 || Loss: 1.1137 ||timer: 0.0766

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0809 sec.
iter 7560 || Loss: 1.3941 ||timer: 0.0788 sec.
iter 7570 || Loss: 2.8303 ||timer: 0.0766 sec.
iter 7580 || Loss: 2.1600 ||timer: 0.0810 sec.
iter 7590 || Loss: 1.4374 ||timer: 0.0776 sec.
iter 7600 || Loss: 1.0319 ||timer: 0.0807 sec.
iter 7610 || Loss: 1.9339 ||timer: 0.1097 sec.
iter 7620 || Loss: 1.0849 ||timer: 0.0868 sec.
iter 7630 || Loss: 2.4769 ||timer: 0.0837 sec.
iter 7640 || Loss: 2.0174 ||timer: 0.0762 sec.
iter 7650 || Loss: 1.9836 ||timer: 0.0791 sec.
iter 7660 || Loss: 1.5968 ||timer: 0.0792 sec.
iter 7670 || Loss: 0.9520 ||timer: 0.0801 sec.
iter 7680 || Loss: 1.0284 ||timer: 0.0865 sec.
iter 7690 || Loss: 2.5440 ||timer: 0.0851 sec.
iter 7700 || Loss: 0.9714 ||timer: 0.0786 sec.
iter 7710 || Loss: 0.9735 ||timer: 0.0832 sec.
iter 7720 || Loss: 1.3304 ||timer: 0.0781 sec.
iter 7730 || Loss: 1.1062 ||timer: 0.0776 sec.
iter 7740 || Loss: 0.7465 ||timer: 0.1027 sec.
iter 7750 || Loss: 4.2258 ||timer: 0.0787 sec.
iter 7760 || Loss: 0.7894 ||timer: 0.0790

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0922 sec.
iter 7920 || Loss: 1.4018 ||timer: 0.0797 sec.
iter 7930 || Loss: 0.9546 ||timer: 0.0851 sec.
iter 7940 || Loss: 0.7198 ||timer: 0.0755 sec.
iter 7950 || Loss: 2.9011 ||timer: 0.0761 sec.
iter 7960 || Loss: 2.4683 ||timer: 0.0768 sec.
iter 7970 || Loss: 1.7071 ||timer: 0.0801 sec.
iter 7980 || Loss: 2.3111 ||timer: 0.0851 sec.
iter 7990 || Loss: 1.6153 ||Change learning rate to:  1.0000000000000003e-05
timer: 0.0807 sec.
iter 8000 || Loss: 1.1054 ||Saving state, iter: 8000
timer: 0.0810 sec.
iter 8010 || Loss: 0.7061 ||timer: 0.0863 sec.
iter 8020 || Loss: 1.2302 ||timer: 0.0863 sec.
iter 8030 || Loss: 1.0871 ||timer: 0.1004 sec.
iter 8040 || Loss: 2.0072 ||timer: 0.0905 sec.
iter 8050 || Loss: 2.3318 ||timer: 0.0885 sec.
iter 8060 || Loss: 3.3698 ||timer: 0.0886 sec.
iter 8070 || Loss: 1.1260 ||timer: 0.0868 sec.
iter 8080 || Loss: 0.8367 ||timer: 0.0876 sec.
iter 8090 || Loss: 1.4382 ||timer: 0.0763 sec.
iter 8100 || Loss: 2.0640 ||timer: 0.0800 sec.
iter 8110 || L

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0868 sec.
iter 8280 || Loss: 1.5221 ||timer: 0.0803 sec.
iter 8290 || Loss: 1.5972 ||timer: 0.0805 sec.
iter 8300 || Loss: 1.1717 ||timer: 0.0835 sec.
iter 8310 || Loss: 1.2290 ||timer: 0.0805 sec.
iter 8320 || Loss: 0.7363 ||timer: 0.0774 sec.
iter 8330 || Loss: 1.0667 ||timer: 0.0769 sec.
iter 8340 || Loss: 3.7363 ||timer: 0.0765 sec.
iter 8350 || Loss: 0.5646 ||timer: 0.0813 sec.
iter 8360 || Loss: 0.9207 ||timer: 0.0834 sec.
iter 8370 || Loss: 0.9432 ||timer: 0.0838 sec.
iter 8380 || Loss: 1.2337 ||timer: 0.0812 sec.
iter 8390 || Loss: 1.3579 ||timer: 0.0794 sec.
iter 8400 || Loss: 1.2071 ||timer: 0.0804 sec.
iter 8410 || Loss: 1.1032 ||timer: 0.0840 sec.
iter 8420 || Loss: 3.3050 ||timer: 0.0815 sec.
iter 8430 || Loss: 0.7918 ||timer: 0.0767 sec.
iter 8440 || Loss: 1.0243 ||timer: 0.0838 sec.
iter 8450 || Loss: 1.1186 ||timer: 0.0824 sec.
iter 8460 || Loss: 2.2551 ||timer: 0.0895 sec.
iter 8470 || Loss: 2.2999 ||timer: 0.0817 sec.
iter 8480 || Loss: 1.1093 ||timer: 0.0781

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0801 sec.
iter 8640 || Loss: 1.5111 ||timer: 0.0774 sec.
iter 8650 || Loss: 1.8237 ||timer: 0.0791 sec.
iter 8660 || Loss: 1.0133 ||timer: 0.0758 sec.
iter 8670 || Loss: 2.5143 ||timer: 0.0795 sec.
iter 8680 || Loss: 2.3021 ||timer: 0.0763 sec.
iter 8690 || Loss: 1.1208 ||timer: 0.0778 sec.
iter 8700 || Loss: 2.1699 ||timer: 0.0790 sec.
iter 8710 || Loss: 1.5768 ||timer: 0.0770 sec.
iter 8720 || Loss: 0.6186 ||timer: 0.0759 sec.
iter 8730 || Loss: 1.2407 ||timer: 0.0778 sec.
iter 8740 || Loss: 1.5641 ||timer: 0.0756 sec.
iter 8750 || Loss: 1.2045 ||timer: 0.0761 sec.
iter 8760 || Loss: 1.9024 ||timer: 0.0778 sec.
iter 8770 || Loss: 0.8061 ||timer: 0.0799 sec.
iter 8780 || Loss: 0.8798 ||timer: 0.0761 sec.
iter 8790 || Loss: 0.9959 ||timer: 0.0782 sec.
iter 8800 || Loss: 1.6815 ||timer: 0.0759 sec.
iter 8810 || Loss: 3.5193 ||timer: 0.0773 sec.
iter 8820 || Loss: 2.8999 ||timer: 0.0759 sec.
iter 8830 || Loss: 0.5801 ||timer: 0.0803 sec.
iter 8840 || Loss: 0.8537 ||timer: 0.0755

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0893 sec.
iter 9000 || Loss: 1.2172 ||Saving state, iter: 9000
timer: 0.0761 sec.
iter 9010 || Loss: 1.1595 ||timer: 0.0763 sec.
iter 9020 || Loss: 0.7511 ||timer: 0.0779 sec.
iter 9030 || Loss: 1.2044 ||timer: 0.0759 sec.
iter 9040 || Loss: 2.1059 ||timer: 0.0773 sec.
iter 9050 || Loss: 1.4973 ||timer: 0.0767 sec.
iter 9060 || Loss: 1.6228 ||timer: 0.0775 sec.
iter 9070 || Loss: 2.1642 ||timer: 0.0788 sec.
iter 9080 || Loss: 1.9699 ||timer: 0.0772 sec.
iter 9090 || Loss: 2.0270 ||timer: 0.0782 sec.
iter 9100 || Loss: 0.9926 ||timer: 0.0782 sec.
iter 9110 || Loss: 0.9810 ||timer: 0.0803 sec.
iter 9120 || Loss: 1.7726 ||timer: 0.0778 sec.
iter 9130 || Loss: 0.4963 ||timer: 0.0783 sec.
iter 9140 || Loss: 0.8552 ||timer: 0.0767 sec.
iter 9150 || Loss: 1.7793 ||timer: 0.0773 sec.
iter 9160 || Loss: 0.8751 ||timer: 0.0787 sec.
iter 9170 || Loss: 1.0946 ||timer: 0.0766 sec.
iter 9180 || Loss: 1.1355 ||timer: 0.0766 sec.
iter 9190 || Loss: 0.8506 ||timer: 0.0757 sec.
iter 9200 || Los

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0846 sec.
iter 9360 || Loss: 1.5151 ||timer: 0.0753 sec.
iter 9370 || Loss: 0.9068 ||timer: 0.0798 sec.
iter 9380 || Loss: 1.1891 ||timer: 0.0777 sec.
iter 9390 || Loss: 0.7823 ||timer: 0.0787 sec.
iter 9400 || Loss: 1.6601 ||timer: 0.0797 sec.
iter 9410 || Loss: 0.8618 ||timer: 0.0792 sec.
iter 9420 || Loss: 1.5777 ||timer: 0.0762 sec.
iter 9430 || Loss: 1.4199 ||timer: 0.0778 sec.
iter 9440 || Loss: 1.5777 ||timer: 0.0767 sec.
iter 9450 || Loss: 1.1468 ||timer: 0.0765 sec.
iter 9460 || Loss: 2.3009 ||timer: 0.0784 sec.
iter 9470 || Loss: 1.2812 ||timer: 0.0750 sec.
iter 9480 || Loss: 0.9672 ||timer: 0.0770 sec.
iter 9490 || Loss: 2.6355 ||timer: 0.0749 sec.
iter 9500 || Loss: 1.7482 ||Saving state, iter: 9500
timer: 0.0758 sec.
iter 9510 || Loss: 3.3833 ||timer: 0.0764 sec.
iter 9520 || Loss: 2.5638 ||timer: 0.0760 sec.
iter 9530 || Loss: 1.4368 ||timer: 0.0800 sec.
iter 9540 || Loss: 0.7537 ||timer: 0.0751 sec.
iter 9550 || Loss: 1.9187 ||timer: 0.0794 sec.
iter 9560 || Los

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0832 sec.
iter 9720 || Loss: 2.2593 ||timer: 0.0756 sec.
iter 9730 || Loss: 1.2741 ||timer: 0.0780 sec.
iter 9740 || Loss: 1.3184 ||timer: 0.0770 sec.
iter 9750 || Loss: 1.6667 ||timer: 0.0774 sec.
iter 9760 || Loss: 1.4372 ||timer: 0.0772 sec.
iter 9770 || Loss: 2.1191 ||timer: 0.0793 sec.
iter 9780 || Loss: 1.2574 ||timer: 0.0797 sec.
iter 9790 || Loss: 1.2535 ||timer: 0.0786 sec.
iter 9800 || Loss: 1.4462 ||timer: 0.0752 sec.
iter 9810 || Loss: 1.0271 ||timer: 0.0795 sec.
iter 9820 || Loss: 0.7073 ||timer: 0.0788 sec.
iter 9830 || Loss: 1.0438 ||timer: 0.0792 sec.
iter 9840 || Loss: 1.5741 ||timer: 0.0800 sec.
iter 9850 || Loss: 2.8932 ||timer: 0.0801 sec.
iter 9860 || Loss: 1.4335 ||timer: 0.0798 sec.
iter 9870 || Loss: 1.0679 ||timer: 0.0758 sec.
iter 9880 || Loss: 1.0891 ||timer: 0.0757 sec.
iter 9890 || Loss: 2.3172 ||timer: 0.0784 sec.
iter 9900 || Loss: 0.4749 ||timer: 0.0817 sec.
iter 9910 || Loss: 1.3807 ||timer: 0.0794 sec.
iter 9920 || Loss: 1.0715 ||timer: 0.0777

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0796 sec.
iter 10080 || Loss: 1.8580 ||timer: 0.0756 sec.
iter 10090 || Loss: 0.7519 ||timer: 0.0763 sec.
iter 10100 || Loss: 2.2179 ||timer: 0.0770 sec.
iter 10110 || Loss: 2.7253 ||timer: 0.0765 sec.
iter 10120 || Loss: 1.8849 ||timer: 0.0763 sec.
iter 10130 || Loss: 1.0008 ||timer: 0.0776 sec.
iter 10140 || Loss: 1.6902 ||timer: 0.0792 sec.
iter 10150 || Loss: 2.5188 ||timer: 0.0776 sec.
iter 10160 || Loss: 1.1895 ||timer: 0.0783 sec.
iter 10170 || Loss: 1.2821 ||timer: 0.0793 sec.
iter 10180 || Loss: 1.2753 ||timer: 0.0792 sec.
iter 10190 || Loss: 1.3690 ||timer: 0.0787 sec.
iter 10200 || Loss: 1.0341 ||timer: 0.0788 sec.
iter 10210 || Loss: 1.0232 ||timer: 0.0786 sec.
iter 10220 || Loss: 0.7916 ||timer: 0.0760 sec.
iter 10230 || Loss: 1.2386 ||timer: 0.0770 sec.
iter 10240 || Loss: 3.6657 ||timer: 0.0765 sec.
iter 10250 || Loss: 0.5687 ||timer: 0.0760 sec.
iter 10260 || Loss: 1.2907 ||timer: 0.0756 sec.
iter 10270 || Loss: 1.0639 ||timer: 0.0778 sec.
iter 10280 || Loss: 1

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0920 sec.
iter 10440 || Loss: 1.5192 ||timer: 0.0782 sec.
iter 10450 || Loss: 1.3662 ||timer: 0.0762 sec.
iter 10460 || Loss: 1.0794 ||timer: 0.0773 sec.
iter 10470 || Loss: 1.7964 ||timer: 0.0767 sec.
iter 10480 || Loss: 1.1946 ||timer: 0.0785 sec.
iter 10490 || Loss: 2.6090 ||timer: 0.0788 sec.
iter 10500 || Loss: 2.4157 ||Saving state, iter: 10500
timer: 0.0786 sec.
iter 10510 || Loss: 2.1800 ||timer: 0.0754 sec.
iter 10520 || Loss: 1.8963 ||timer: 0.0785 sec.
iter 10530 || Loss: 2.1660 ||timer: 0.0773 sec.
iter 10540 || Loss: 1.3194 ||timer: 0.0755 sec.
iter 10550 || Loss: 3.9760 ||timer: 0.0782 sec.
iter 10560 || Loss: 1.5573 ||timer: 0.0772 sec.
iter 10570 || Loss: 1.1326 ||timer: 0.0775 sec.
iter 10580 || Loss: 1.4300 ||timer: 0.0762 sec.
iter 10590 || Loss: 1.6231 ||timer: 0.0787 sec.
iter 10600 || Loss: 1.2490 ||timer: 0.0800 sec.
iter 10610 || Loss: 3.6011 ||timer: 0.0773 sec.
iter 10620 || Loss: 1.0228 ||timer: 0.0772 sec.
iter 10630 || Loss: 1.2460 ||timer: 0.0794 

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0885 sec.
iter 10800 || Loss: 1.1829 ||timer: 0.0774 sec.
iter 10810 || Loss: 1.2299 ||timer: 0.0754 sec.
iter 10820 || Loss: 1.0729 ||timer: 0.0765 sec.
iter 10830 || Loss: 2.0024 ||timer: 0.0771 sec.
iter 10840 || Loss: 0.5461 ||timer: 0.0754 sec.
iter 10850 || Loss: 0.9502 ||timer: 0.0753 sec.
iter 10860 || Loss: 3.2477 ||timer: 0.0795 sec.
iter 10870 || Loss: 1.5971 ||timer: 0.0783 sec.
iter 10880 || Loss: 2.3172 ||timer: 0.0772 sec.
iter 10890 || Loss: 1.9923 ||timer: 0.0754 sec.
iter 10900 || Loss: 0.5486 ||timer: 0.0771 sec.
iter 10910 || Loss: 1.1332 ||timer: 0.0792 sec.
iter 10920 || Loss: 1.6307 ||timer: 0.0773 sec.
iter 10930 || Loss: 1.9409 ||timer: 0.0800 sec.
iter 10940 || Loss: 1.1533 ||timer: 0.0758 sec.
iter 10950 || Loss: 1.4999 ||timer: 0.0773 sec.
iter 10960 || Loss: 0.8083 ||timer: 0.0797 sec.
iter 10970 || Loss: 3.5474 ||timer: 0.0782 sec.
iter 10980 || Loss: 2.4974 ||timer: 0.0777 sec.
iter 10990 || Loss: 1.8210 ||timer: 0.0758 sec.
iter 11000 || Loss: 2

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0864 sec.
iter 11160 || Loss: 1.7270 ||timer: 0.0858 sec.
iter 11170 || Loss: 1.0404 ||timer: 0.0765 sec.
iter 11180 || Loss: 1.0291 ||timer: 0.0757 sec.
iter 11190 || Loss: 0.7998 ||timer: 0.0790 sec.
iter 11200 || Loss: 1.0967 ||timer: 0.0759 sec.
iter 11210 || Loss: 0.4798 ||timer: 0.0793 sec.
iter 11220 || Loss: 1.3294 ||timer: 0.0790 sec.
iter 11230 || Loss: 2.5579 ||timer: 0.0771 sec.
iter 11240 || Loss: 1.8435 ||timer: 0.0788 sec.
iter 11250 || Loss: 1.1737 ||timer: 0.0770 sec.
iter 11260 || Loss: 2.6554 ||timer: 0.0802 sec.
iter 11270 || Loss: 1.3574 ||timer: 0.0769 sec.
iter 11280 || Loss: 2.1277 ||timer: 0.0771 sec.
iter 11290 || Loss: 2.3854 ||timer: 0.0765 sec.
iter 11300 || Loss: 2.0177 ||timer: 0.0759 sec.
iter 11310 || Loss: 1.1185 ||timer: 0.0753 sec.
iter 11320 || Loss: 1.0386 ||timer: 0.0790 sec.
iter 11330 || Loss: 1.2572 ||timer: 0.0779 sec.
iter 11340 || Loss: 1.8094 ||timer: 0.0790 sec.
iter 11350 || Loss: 0.6913 ||timer: 0.0787 sec.
iter 11360 || Loss: 0

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0832 sec.
iter 11520 || Loss: 1.4795 ||timer: 0.0755 sec.
iter 11530 || Loss: 0.9070 ||timer: 0.0786 sec.
iter 11540 || Loss: 2.1991 ||timer: 0.0760 sec.
iter 11550 || Loss: 1.4186 ||timer: 0.0756 sec.
iter 11560 || Loss: 0.8704 ||timer: 0.0767 sec.
iter 11570 || Loss: 1.4955 ||timer: 0.0789 sec.
iter 11580 || Loss: 2.3556 ||timer: 0.0753 sec.
iter 11590 || Loss: 2.7505 ||timer: 0.0764 sec.
iter 11600 || Loss: 1.1191 ||timer: 0.0774 sec.
iter 11610 || Loss: 2.8836 ||timer: 0.0779 sec.
iter 11620 || Loss: 0.9662 ||timer: 0.0797 sec.
iter 11630 || Loss: 1.4430 ||timer: 0.0794 sec.
iter 11640 || Loss: 0.8218 ||timer: 0.0804 sec.
iter 11650 || Loss: 1.8122 ||timer: 0.0770 sec.
iter 11660 || Loss: 1.6982 ||timer: 0.0771 sec.
iter 11670 || Loss: 1.1059 ||timer: 0.0794 sec.
iter 11680 || Loss: 1.3579 ||timer: 0.0753 sec.
iter 11690 || Loss: 1.5783 ||timer: 0.0801 sec.
iter 11700 || Loss: 1.0553 ||timer: 0.0775 sec.
iter 11710 || Loss: 0.9126 ||timer: 0.0768 sec.
iter 11720 || Loss: 3

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0882 sec.
iter 11880 || Loss: 0.8494 ||timer: 0.0768 sec.
iter 11890 || Loss: 2.5590 ||timer: 0.0756 sec.
iter 11900 || Loss: 4.1760 ||timer: 0.0770 sec.
iter 11910 || Loss: 0.9960 ||timer: 0.0758 sec.
iter 11920 || Loss: 2.8341 ||timer: 0.0788 sec.
iter 11930 || Loss: 2.5275 ||timer: 0.0798 sec.
iter 11940 || Loss: 0.9264 ||timer: 0.0808 sec.
iter 11950 || Loss: 1.1527 ||timer: 0.0827 sec.
iter 11960 || Loss: 1.3524 ||timer: 0.0815 sec.
iter 11970 || Loss: 1.4201 ||timer: 0.0789 sec.
iter 11980 || Loss: 1.4168 ||timer: 0.0845 sec.
iter 11990 || Loss: 1.2637 ||Change learning rate to:  1.0000000000000002e-06
timer: 0.0758 sec.
iter 12000 || Loss: 0.9989 ||Saving state, iter: 12000
timer: 0.0794 sec.
iter 12010 || Loss: 0.9587 ||timer: 0.0771 sec.
iter 12020 || Loss: 0.7675 ||timer: 0.0830 sec.
iter 12030 || Loss: 1.4515 ||timer: 0.0828 sec.
iter 12040 || Loss: 0.9484 ||timer: 0.0822 sec.
iter 12050 || Loss: 1.0418 ||timer: 0.0763 sec.
iter 12060 || Loss: 1.4960 ||timer: 0.0762

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0785 sec.
iter 12240 || Loss: 1.1276 ||timer: 0.0751 sec.
iter 12250 || Loss: 2.1024 ||timer: 0.0776 sec.
iter 12260 || Loss: 1.8684 ||timer: 0.0775 sec.
iter 12270 || Loss: 2.0994 ||timer: 0.0761 sec.
iter 12280 || Loss: 1.1915 ||timer: 0.0757 sec.
iter 12290 || Loss: 1.0387 ||timer: 0.0757 sec.
iter 12300 || Loss: 1.2463 ||timer: 0.0762 sec.
iter 12310 || Loss: 1.5373 ||timer: 0.0774 sec.
iter 12320 || Loss: 1.8366 ||timer: 0.0762 sec.
iter 12330 || Loss: 2.0142 ||timer: 0.0799 sec.
iter 12340 || Loss: 1.3378 ||timer: 0.0793 sec.
iter 12350 || Loss: 1.6365 ||timer: 0.0755 sec.
iter 12360 || Loss: 1.3815 ||timer: 0.0756 sec.
iter 12370 || Loss: 1.1496 ||timer: 0.0789 sec.
iter 12380 || Loss: 0.8756 ||timer: 0.0795 sec.
iter 12390 || Loss: 1.7125 ||timer: 0.0794 sec.
iter 12400 || Loss: 1.8704 ||timer: 0.0769 sec.
iter 12410 || Loss: 1.3590 ||timer: 0.0803 sec.
iter 12420 || Loss: 1.9319 ||timer: 0.0799 sec.
iter 12430 || Loss: 1.4079 ||timer: 0.0790 sec.
iter 12440 || Loss: 0

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0784 sec.
iter 12600 || Loss: 1.9617 ||timer: 0.0774 sec.
iter 12610 || Loss: 1.1850 ||timer: 0.0761 sec.
iter 12620 || Loss: 1.3246 ||timer: 0.0830 sec.
iter 12630 || Loss: 2.2574 ||timer: 0.0813 sec.
iter 12640 || Loss: 0.6349 ||timer: 0.0818 sec.
iter 12650 || Loss: 2.1414 ||timer: 0.0844 sec.
iter 12660 || Loss: 0.6391 ||timer: 0.0756 sec.
iter 12670 || Loss: 2.0055 ||timer: 0.0770 sec.
iter 12680 || Loss: 1.0197 ||timer: 0.0759 sec.
iter 12690 || Loss: 1.2081 ||timer: 0.0775 sec.
iter 12700 || Loss: 2.5431 ||timer: 0.0790 sec.
iter 12710 || Loss: 2.0128 ||timer: 0.0797 sec.
iter 12720 || Loss: 0.8564 ||timer: 0.0764 sec.
iter 12730 || Loss: 1.0510 ||timer: 0.0792 sec.
iter 12740 || Loss: 1.2082 ||timer: 0.0796 sec.
iter 12750 || Loss: 0.9591 ||timer: 0.0793 sec.
iter 12760 || Loss: 1.1471 ||timer: 0.0800 sec.
iter 12770 || Loss: 1.9258 ||timer: 0.0781 sec.
iter 12780 || Loss: 1.0903 ||timer: 0.0780 sec.
iter 12790 || Loss: 1.5232 ||timer: 0.0754 sec.
iter 12800 || Loss: 2

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0794 sec.
iter 12960 || Loss: 2.8388 ||timer: 0.0753 sec.
iter 12970 || Loss: 1.3680 ||timer: 0.0755 sec.
iter 12980 || Loss: 0.9698 ||timer: 0.0756 sec.
iter 12990 || Loss: 1.3444 ||timer: 0.0796 sec.
iter 13000 || Loss: 2.5192 ||Saving state, iter: 13000
timer: 0.0757 sec.
iter 13010 || Loss: 0.6353 ||timer: 0.0798 sec.
iter 13020 || Loss: 1.1511 ||timer: 0.0765 sec.
iter 13030 || Loss: 3.2567 ||timer: 0.0779 sec.
iter 13040 || Loss: 1.0734 ||timer: 0.0784 sec.
iter 13050 || Loss: 1.5157 ||timer: 0.0781 sec.
iter 13060 || Loss: 0.9568 ||timer: 0.0795 sec.
iter 13070 || Loss: 1.3141 ||timer: 0.0773 sec.
iter 13080 || Loss: 1.2251 ||timer: 0.0794 sec.
iter 13090 || Loss: 1.7429 ||timer: 0.0776 sec.
iter 13100 || Loss: 1.3130 ||timer: 0.0789 sec.
iter 13110 || Loss: 1.4061 ||timer: 0.0784 sec.
iter 13120 || Loss: 0.8824 ||timer: 0.0802 sec.
iter 13130 || Loss: 1.4472 ||timer: 0.0783 sec.
iter 13140 || Loss: 3.1764 ||timer: 0.0764 sec.
iter 13150 || Loss: 1.3899 ||timer: 0.0782 

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0922 sec.
iter 13320 || Loss: 1.3065 ||timer: 0.0755 sec.
iter 13330 || Loss: 1.2544 ||timer: 0.0760 sec.
iter 13340 || Loss: 2.0007 ||timer: 0.0772 sec.
iter 13350 || Loss: 1.2996 ||timer: 0.0762 sec.
iter 13360 || Loss: 2.0849 ||timer: 0.0786 sec.
iter 13370 || Loss: 0.4736 ||timer: 0.0792 sec.
iter 13380 || Loss: 7.6418 ||timer: 0.0795 sec.
iter 13390 || Loss: 1.1954 ||timer: 0.0766 sec.
iter 13400 || Loss: 0.7239 ||timer: 0.0783 sec.
iter 13410 || Loss: 1.1432 ||timer: 0.0798 sec.
iter 13420 || Loss: 1.5039 ||timer: 0.0789 sec.
iter 13430 || Loss: 2.6982 ||timer: 0.0798 sec.
iter 13440 || Loss: 1.2895 ||timer: 0.0791 sec.
iter 13450 || Loss: 1.1086 ||timer: 0.0801 sec.
iter 13460 || Loss: 1.5550 ||timer: 0.0792 sec.
iter 13470 || Loss: 1.7056 ||timer: 0.0759 sec.
iter 13480 || Loss: 1.5149 ||timer: 0.0768 sec.
iter 13490 || Loss: 2.5679 ||timer: 0.0763 sec.
iter 13500 || Loss: 0.7130 ||Saving state, iter: 13500
timer: 0.0757 sec.
iter 13510 || Loss: 1.0123 ||timer: 0.0779 

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0838 sec.
iter 13680 || Loss: 1.0564 ||timer: 0.0781 sec.
iter 13690 || Loss: 1.3714 ||timer: 0.0754 sec.
iter 13700 || Loss: 1.5314 ||timer: 0.0811 sec.
iter 13710 || Loss: 2.8202 ||timer: 0.0780 sec.
iter 13720 || Loss: 1.1600 ||timer: 0.0760 sec.
iter 13730 || Loss: 1.1747 ||timer: 0.0759 sec.
iter 13740 || Loss: 1.4462 ||timer: 0.0773 sec.
iter 13750 || Loss: 1.5544 ||timer: 0.0784 sec.
iter 13760 || Loss: 1.2780 ||timer: 0.0791 sec.
iter 13770 || Loss: 1.2602 ||timer: 0.0790 sec.
iter 13780 || Loss: 0.7117 ||timer: 0.0760 sec.
iter 13790 || Loss: 2.0509 ||timer: 0.0764 sec.
iter 13800 || Loss: 1.7964 ||timer: 0.0762 sec.
iter 13810 || Loss: 3.7208 ||timer: 0.0777 sec.
iter 13820 || Loss: 0.5796 ||timer: 0.0759 sec.
iter 13830 || Loss: 1.3591 ||timer: 0.0763 sec.
iter 13840 || Loss: 0.9888 ||timer: 0.0760 sec.
iter 13850 || Loss: 0.5059 ||timer: 0.0766 sec.
iter 13860 || Loss: 1.3457 ||timer: 0.0774 sec.
iter 13870 || Loss: 1.4603 ||timer: 0.0792 sec.
iter 13880 || Loss: 1

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0922 sec.
iter 14040 || Loss: 1.5760 ||timer: 0.0770 sec.
iter 14050 || Loss: 1.1507 ||timer: 0.0766 sec.
iter 14060 || Loss: 2.4110 ||timer: 0.0778 sec.
iter 14070 || Loss: 0.8569 ||timer: 0.0771 sec.
iter 14080 || Loss: 0.7231 ||timer: 0.0801 sec.
iter 14090 || Loss: 0.8619 ||timer: 0.0782 sec.
iter 14100 || Loss: 1.2780 ||timer: 0.0809 sec.
iter 14110 || Loss: 1.2839 ||timer: 0.0801 sec.
iter 14120 || Loss: 0.8151 ||timer: 0.0786 sec.
iter 14130 || Loss: 1.9879 ||timer: 0.0757 sec.
iter 14140 || Loss: 0.9276 ||timer: 0.0803 sec.
iter 14150 || Loss: 1.2406 ||timer: 0.0789 sec.
iter 14160 || Loss: 1.7646 ||timer: 0.0774 sec.
iter 14170 || Loss: 2.4705 ||timer: 0.0778 sec.
iter 14180 || Loss: 2.0781 ||timer: 0.0786 sec.
iter 14190 || Loss: 3.0768 ||timer: 0.0756 sec.
iter 14200 || Loss: 0.6599 ||timer: 0.0799 sec.
iter 14210 || Loss: 1.2428 ||timer: 0.0772 sec.
iter 14220 || Loss: 1.4052 ||timer: 0.0797 sec.
iter 14230 || Loss: 1.0428 ||timer: 0.0803 sec.
iter 14240 || Loss: 1

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0831 sec.
iter 14400 || Loss: 0.8349 ||timer: 0.0780 sec.
iter 14410 || Loss: 1.6484 ||timer: 0.0753 sec.
iter 14420 || Loss: 1.0334 ||timer: 0.0809 sec.
iter 14430 || Loss: 1.8753 ||timer: 0.0801 sec.
iter 14440 || Loss: 1.1647 ||timer: 0.0757 sec.
iter 14450 || Loss: 1.7800 ||timer: 0.0782 sec.
iter 14460 || Loss: 2.2481 ||timer: 0.0785 sec.
iter 14470 || Loss: 0.9344 ||timer: 0.0789 sec.
iter 14480 || Loss: 0.7249 ||timer: 0.0803 sec.
iter 14490 || Loss: 1.3596 ||timer: 0.0785 sec.
iter 14500 || Loss: 2.1531 ||Saving state, iter: 14500
timer: 0.0782 sec.
iter 14510 || Loss: 0.8887 ||timer: 0.0775 sec.
iter 14520 || Loss: 1.2719 ||timer: 0.0763 sec.
iter 14530 || Loss: 0.9336 ||timer: 0.0759 sec.
iter 14540 || Loss: 1.4627 ||timer: 0.0794 sec.
iter 14550 || Loss: 1.6279 ||timer: 0.0778 sec.
iter 14560 || Loss: 1.4986 ||timer: 0.0760 sec.
iter 14570 || Loss: 1.8509 ||timer: 0.0783 sec.
iter 14580 || Loss: 1.3794 ||timer: 0.0779 sec.
iter 14590 || Loss: 0.7714 ||timer: 0.0763 

  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)
  mode = random.choice(self.sample_options)


timer: 0.0990 sec.
iter 14760 || Loss: 2.2087 ||timer: 0.0770 sec.
iter 14770 || Loss: 0.7899 ||timer: 0.0767 sec.
iter 14780 || Loss: 0.7812 ||timer: 0.0761 sec.
iter 14790 || Loss: 1.2642 ||timer: 0.0757 sec.
iter 14800 || Loss: 0.7595 ||timer: 0.0804 sec.
iter 14810 || Loss: 1.2602 ||timer: 0.0816 sec.
iter 14820 || Loss: 1.2626 ||timer: 0.0780 sec.
iter 14830 || Loss: 3.2965 ||timer: 0.0776 sec.
iter 14840 || Loss: 2.2917 ||timer: 0.0800 sec.
iter 14850 || Loss: 1.0362 ||timer: 0.0797 sec.
iter 14860 || Loss: 0.7668 ||timer: 0.0764 sec.
iter 14870 || Loss: 0.9689 ||timer: 0.0791 sec.
iter 14880 || Loss: 1.1097 ||timer: 0.0763 sec.
iter 14890 || Loss: 1.1897 ||timer: 0.0771 sec.
iter 14900 || Loss: 3.5127 ||timer: 0.0791 sec.
iter 14910 || Loss: 1.2925 ||timer: 0.0769 sec.
iter 14920 || Loss: 1.5548 ||timer: 0.0786 sec.
iter 14930 || Loss: 0.8008 ||timer: 0.0797 sec.
iter 14940 || Loss: 2.0783 ||timer: 0.0771 sec.
iter 14950 || Loss: 1.6965 ||timer: 0.0797 sec.
iter 14960 || Loss: 0