## Vanilla Vision Transformer From Scratch

In [1]:
import math
import time
import numpy as np
import copy

from utils import dataset
from models import VanillaVisionTransformer

import matplotlib.pyplot as plt
import matplotlib

# Pytorch packages
import torch
import torch.optim as optim
import torch.nn as nn

# torchvision
import torchvision
from torchvision import transforms

# Tqdm progress bar
from tqdm import tqdm_notebook

# obtain reproducible results in PyTorch
def seed_everything(seed: int):
    import random, os
    import numpy as np
    import torch
    
    random.seed(seed)
    os.environ['PYTHONHASHSEED'] = str(seed)
    np.random.seed(seed)
    torch.manual_seed(seed)
    torch.cuda.manual_seed(seed)
    torch.backends.cudnn.deterministic = True
    torch.backends.cudnn.benchmark = True
    
seed_everything(42)

In [2]:
# Check device availability
device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
print("You are using device: %s" % device)

You are using device: cuda


In [3]:
LEARNING_RATE = 0.003
MOMENTUM = 0.5
WEIGHT_DECAY_REGULARIZATION_TERM = 0.005
NUM_EPOCHS = 1
BATCH_SIZE = 1

PATCH_SIZE = 4
HIDDEN_DIM = 512
EMBED_DIM = 256 # aka mlp_dim
NUM_CHANNELS = 3
NUM_HEADS = 8
NUM_LAYERS = 6
DROPOUT = 0.2

# converts image into patches. patch_size is the size of each patch
def img_to_patches(x, patch_size, flatten_channels=True):
    B, C, H, W = x.shape
    x = x.reshape(B, C, H//patch_size, patch_size, W//patch_size, patch_size)
    x = x.permute(0, 2, 4, 1, 3, 5) # [B, H', W', C, p_H, p_W]
    x = x.flatten(1,2)              # [B, H'*W', C, p_H, p_W]
    if flatten_channels:
        x = x.flatten(2,4)          # [B, H'*W', C*p_H*p_W]
    return x

class AverageMeter(object):
    """Computes and stores the average and current value"""

    def __init__(self):
        self.reset()

    def reset(self):
        self.val = 0
        self.avg = 0
        self.sum = 0
        self.count = 0

    def update(self, val, n=1):
        self.val = val
        self.sum += val * n
        self.count += n

        self.avg = self.sum / self.count

def train(epoch, data_loader, model, optimizer, criterion, scaler=None):
    iter_time = AverageMeter()
    losses = AverageMeter()

    for idx, (data, target) in enumerate(data_loader):
        start = time.time()
        
        if torch.cuda.is_available():
            data = data.cuda()
            target = target.cuda()

        with torch.autocast("cuda"): #Automatic Mixed precision
            data = img_to_patches(data, patch_size = PATCH_SIZE, flatten_channels=True)
            out = model(data).to(device)
#             loss = torch.sqrt(criterion(out, target))
            loss = criterion(out, target)
    
#         print("DATA TYPES")
#         print(out.dtype)
#         print(target.dtype)

#         optimizer.zero_grad()
#         loss.backward()
#         optimizer.step()

        for param in model.parameters():
            param.grad = None
        scaler.scale(loss).backward()
        scaler.step(optimizer)

        scaler.update()
        losses.update(loss, out.shape[0])

        iter_time.update(time.time() - start)
        if idx % 10 == 0:
            print(('Epoch: [{0}][{1}/{2}]\t'
                   'Time {iter_time.val:.3f} ({iter_time.avg:.3f})\t'
                   'Loss {loss.val:.4f} ({loss.avg:.4f})\t'
                  .format(epoch, idx, len(data_loader), iter_time=iter_time, loss=losses)))
    
    return losses.avg

def validate(epoch, validation_loader, model, criterion):
    iter_time = AverageMeter()
    losses = AverageMeter()

    for idx, (data, target) in enumerate(validation_loader):
        start = time.time()

        if torch.cuda.is_available():
            data = data.cuda()
            target = target.cuda()
        target = target.to(torch.float16)

        out = None
        loss = None
        data = img_to_patches(data, patch_size = PATCH_SIZE, flatten_channels=True)

        with torch.no_grad():
            out = model(data).to(device)
#             loss = torch.sqrt(criterion(out, target))
            loss = criterion(out, target)


        losses.update(loss, out.shape[0])

        iter_time.update(time.time() - start)
        if idx % 10 == 0:
            print(('Epoch: [{0}][{1}/{2}]\t'
                   'Time {iter_time.val:.3f} ({iter_time.avg:.3f})\t')
                  .format(epoch, idx, len(validation_loader), iter_time=iter_time, loss=losses))

    print("* Average Loss @1: {loss.avg:.4f}".format(loss=losses))
    return losses.avg

def RMSELoss(yhat, y, eps=1e-6):
    return torch.sqrt(torch.mean((yhat-y)**2) + eps)

def plots(losses, lr=LEARNING_RATE, reg=WEIGHT_DECAY_REGULARIZATION_TERM, batch=BATCH_SIZE): #, momentum=MOMENTUM):
    fig1, ax1 = plt.subplots(figsize=(8, 10))
    ax1.plot(losses[0], label='Training Losses')
    ax1.plot(losses[1], label='Validation Losses')
    ax1.set_xlabel('Epochs')
    ax1.set_ylabel('RMSE Loss')
    ax1.set_title(f'CNN Loss Curve; LR={lr}; Batch={batch}')
    ax1.legend(loc="best")
    plt.grid()
    plt.show()

In [14]:
## SKIP FOR SIGOPT EXPERIMENT ##

def main():
    torch.cuda.empty_cache()
    # Normalizing images per the paper and resizing each image to 64 x 192.
    transform = transforms.Compose([
        # Citation:
        # https://pytorch.org/vision/stable/transforms.html#scriptable-transforms
        transforms.Resize((64, 192)),
    ])
    # Loading in images with normalization and resizing applied.
    training_set, validation_set, test_set = dataset.load_nvidia_dataset(batch_size=BATCH_SIZE, transform=transform)
    
    image_size = training_set.dataset[0][0].shape

    model = VanillaVisionTransformer.VisionTransformer(device,
                                                image_size,
                                               PATCH_SIZE, 
                                               HIDDEN_DIM,
                                               EMBED_DIM,
                                               NUM_CHANNELS,
                                               NUM_HEADS,
                                               NUM_LAYERS,
                                               DROPOUT).to(device)
    
    criterion = nn.MSELoss()
#     criterion = RMSELoss

    optimizer = torch.optim.Adam(model.parameters(), lr=LEARNING_RATE, weight_decay=WEIGHT_DECAY_REGULARIZATION_TERM)
    scheduler = torch.optim.lr_scheduler.ReduceLROnPlateau(optimizer)
    
    best = float('inf')
    best_model = None
    best_epoch = None
    train_losses = []
    valid_losses = []
    scaler = torch.cuda.amp.GradScaler()


    for epoch in range(NUM_EPOCHS):
        
        # Training.
        train_loss = train(epoch, training_set, model, optimizer, criterion, scaler=scaler)
        temp = train_loss
        temp.cpu()
        temp = float(temp)
        train_losses.append(temp)
        print(f"Average training loss this epoch: {temp:.4f}")
                
        # Validation.
        valid_loss = validate(epoch, validation_set, model, criterion)
        temp = valid_loss
        temp.cpu()
        temp = float(temp)
        valid_losses.append(temp)
        
        scheduler.step(train_loss)
        
        if valid_loss < best:
            best = valid_loss
            best_model = copy.deepcopy(model)
            best_epoch = epoch

            
    print('Best Loss @1: {:.4f}'.format(best))

    torch.save(best_model.state_dict(), './checkpoints/vanilla_vision_transformer.pth')
    
    losses_to_plot = train_losses, valid_losses
    plots(losses_to_plot, 
          lr=LEARNING_RATE, 
          reg=WEIGHT_DECAY_REGULARIZATION_TERM,
          batch=BATCH_SIZE, 
          # momentum=MOMENTUM  # not necessary for ADAM
         )
    
if __name__ == '__main__':
    main()

  return F.mse_loss(input, target, reduction=self.reduction)


Epoch: [0][0/27046]	Time 0.041 (0.041)	Loss 0.3975 (0.3975)	
Epoch: [0][10/27046]	Time 0.018 (0.032)	Loss 3.1339 (2.6590)	
Epoch: [0][20/27046]	Time 0.019 (0.026)	Loss 0.8026 (2.0294)	
Epoch: [0][30/27046]	Time 0.019 (0.024)	Loss 1.1191 (1.6820)	
Epoch: [0][40/27046]	Time 0.018 (0.022)	Loss 0.3027 (1.3419)	
Epoch: [0][50/27046]	Time 0.019 (0.022)	Loss 0.0801 (1.1123)	
Epoch: [0][60/27046]	Time 0.019 (0.021)	Loss 0.0005 (0.9762)	
Epoch: [0][70/27046]	Time 0.019 (0.021)	Loss 0.3077 (0.8651)	
Epoch: [0][80/27046]	Time 0.019 (0.021)	Loss 0.2335 (0.7997)	
Epoch: [0][90/27046]	Time 0.018 (0.020)	Loss 0.2479 (0.7289)	
Epoch: [0][100/27046]	Time 0.019 (0.020)	Loss 0.0162 (0.6837)	
Epoch: [0][110/27046]	Time 0.018 (0.020)	Loss 0.0300 (0.6321)	
Epoch: [0][120/27046]	Time 0.018 (0.020)	Loss 0.0347 (0.5935)	
Epoch: [0][130/27046]	Time 0.018 (0.020)	Loss 0.0876 (0.5621)	
Epoch: [0][140/27046]	Time 0.018 (0.020)	Loss 0.4939 (0.5414)	
Epoch: [0][150/27046]	Time 0.020 (0.020)	Loss 0.3776 (0.5157)	
Epo

Epoch: [0][1300/27046]	Time 0.020 (0.019)	Loss 0.9544 (0.2178)	
Epoch: [0][1310/27046]	Time 0.019 (0.019)	Loss 0.1553 (0.2171)	
Epoch: [0][1320/27046]	Time 0.020 (0.019)	Loss 0.0053 (0.2176)	
Epoch: [0][1330/27046]	Time 0.018 (0.019)	Loss 0.0918 (0.2173)	
Epoch: [0][1340/27046]	Time 0.018 (0.019)	Loss 0.0187 (0.2170)	
Epoch: [0][1350/27046]	Time 0.018 (0.019)	Loss 0.1652 (0.2165)	
Epoch: [0][1360/27046]	Time 0.021 (0.019)	Loss 0.0368 (0.2164)	
Epoch: [0][1370/27046]	Time 0.019 (0.019)	Loss 0.0251 (0.2161)	
Epoch: [0][1380/27046]	Time 0.019 (0.019)	Loss 0.0544 (0.2156)	
Epoch: [0][1390/27046]	Time 0.019 (0.019)	Loss 0.0373 (0.2150)	
Epoch: [0][1400/27046]	Time 0.019 (0.019)	Loss 0.5469 (0.2147)	
Epoch: [0][1410/27046]	Time 0.018 (0.019)	Loss 0.0303 (0.2142)	
Epoch: [0][1420/27046]	Time 0.019 (0.019)	Loss 0.2607 (0.2136)	
Epoch: [0][1430/27046]	Time 0.018 (0.019)	Loss 0.1020 (0.2129)	
Epoch: [0][1440/27046]	Time 0.018 (0.019)	Loss 0.0715 (0.2127)	
Epoch: [0][1450/27046]	Time 0.019 (0.019

Epoch: [0][2590/27046]	Time 0.022 (0.019)	Loss 0.0375 (0.1845)	
Epoch: [0][2600/27046]	Time 0.022 (0.019)	Loss 0.0250 (0.1847)	
Epoch: [0][2610/27046]	Time 0.020 (0.019)	Loss 0.0914 (0.1848)	
Epoch: [0][2620/27046]	Time 0.021 (0.019)	Loss 0.1529 (0.1844)	
Epoch: [0][2630/27046]	Time 0.020 (0.019)	Loss 0.0327 (0.1842)	
Epoch: [0][2640/27046]	Time 0.022 (0.019)	Loss 0.3849 (0.1842)	
Epoch: [0][2650/27046]	Time 0.022 (0.019)	Loss 0.0747 (0.1840)	
Epoch: [0][2660/27046]	Time 0.023 (0.019)	Loss 0.0124 (0.1837)	
Epoch: [0][2670/27046]	Time 0.021 (0.019)	Loss 0.2318 (0.1839)	
Epoch: [0][2680/27046]	Time 0.021 (0.019)	Loss 0.2622 (0.1837)	
Epoch: [0][2690/27046]	Time 0.033 (0.019)	Loss 0.0070 (0.1839)	
Epoch: [0][2700/27046]	Time 0.021 (0.019)	Loss 0.0179 (0.1835)	
Epoch: [0][2710/27046]	Time 0.021 (0.019)	Loss 0.0214 (0.1831)	
Epoch: [0][2720/27046]	Time 0.021 (0.019)	Loss 0.0256 (0.1826)	
Epoch: [0][2730/27046]	Time 0.024 (0.019)	Loss 0.0463 (0.1822)	
Epoch: [0][2740/27046]	Time 0.021 (0.019

Epoch: [0][3890/27046]	Time 0.021 (0.020)	Loss 0.0334 (0.1742)	
Epoch: [0][3900/27046]	Time 0.020 (0.020)	Loss 0.3489 (0.1740)	
Epoch: [0][3910/27046]	Time 0.020 (0.020)	Loss 0.0871 (0.1741)	
Epoch: [0][3920/27046]	Time 0.019 (0.020)	Loss 0.0342 (0.1740)	
Epoch: [0][3930/27046]	Time 0.020 (0.020)	Loss 0.0187 (0.1741)	
Epoch: [0][3940/27046]	Time 0.020 (0.020)	Loss 0.0177 (0.1741)	
Epoch: [0][3950/27046]	Time 0.020 (0.020)	Loss 0.0895 (0.1739)	
Epoch: [0][3960/27046]	Time 0.020 (0.020)	Loss 0.0742 (0.1738)	
Epoch: [0][3970/27046]	Time 0.021 (0.020)	Loss 0.2480 (0.1736)	
Epoch: [0][3980/27046]	Time 0.020 (0.020)	Loss 0.0014 (0.1734)	
Epoch: [0][3990/27046]	Time 0.020 (0.020)	Loss 0.3140 (0.1735)	
Epoch: [0][4000/27046]	Time 0.021 (0.020)	Loss 0.0294 (0.1736)	
Epoch: [0][4010/27046]	Time 0.020 (0.020)	Loss 0.0193 (0.1735)	
Epoch: [0][4020/27046]	Time 0.019 (0.020)	Loss 0.4602 (0.1734)	
Epoch: [0][4030/27046]	Time 0.020 (0.020)	Loss 0.1697 (0.1734)	
Epoch: [0][4040/27046]	Time 0.020 (0.020

Epoch: [0][5180/27046]	Time 0.019 (0.020)	Loss 0.0143 (0.1699)	
Epoch: [0][5190/27046]	Time 0.021 (0.020)	Loss 0.0979 (0.1700)	
Epoch: [0][5200/27046]	Time 0.022 (0.020)	Loss 0.0439 (0.1700)	
Epoch: [0][5210/27046]	Time 0.020 (0.020)	Loss 0.0901 (0.1699)	
Epoch: [0][5220/27046]	Time 0.019 (0.020)	Loss 0.6356 (0.1699)	
Epoch: [0][5230/27046]	Time 0.021 (0.020)	Loss 0.2286 (0.1697)	
Epoch: [0][5240/27046]	Time 0.020 (0.020)	Loss 0.0086 (0.1696)	
Epoch: [0][5250/27046]	Time 0.019 (0.020)	Loss 0.0583 (0.1695)	
Epoch: [0][5260/27046]	Time 0.019 (0.020)	Loss 0.4782 (0.1698)	
Epoch: [0][5270/27046]	Time 0.020 (0.020)	Loss 0.0449 (0.1699)	
Epoch: [0][5280/27046]	Time 0.020 (0.020)	Loss 0.0948 (0.1698)	
Epoch: [0][5290/27046]	Time 0.019 (0.020)	Loss 0.0260 (0.1698)	
Epoch: [0][5300/27046]	Time 0.022 (0.020)	Loss 0.0865 (0.1698)	
Epoch: [0][5310/27046]	Time 0.020 (0.020)	Loss 0.1726 (0.1700)	
Epoch: [0][5320/27046]	Time 0.019 (0.020)	Loss 0.0907 (0.1703)	
Epoch: [0][5330/27046]	Time 0.019 (0.020

Epoch: [0][6480/27046]	Time 0.020 (0.020)	Loss 1.5551 (0.1682)	
Epoch: [0][6490/27046]	Time 0.032 (0.020)	Loss 0.0441 (0.1682)	
Epoch: [0][6500/27046]	Time 0.020 (0.020)	Loss 0.1594 (0.1684)	
Epoch: [0][6510/27046]	Time 0.019 (0.020)	Loss 0.0317 (0.1684)	
Epoch: [0][6520/27046]	Time 0.020 (0.020)	Loss 0.0871 (0.1684)	
Epoch: [0][6530/27046]	Time 0.021 (0.020)	Loss 0.0105 (0.1683)	
Epoch: [0][6540/27046]	Time 0.019 (0.020)	Loss 0.0504 (0.1682)	
Epoch: [0][6550/27046]	Time 0.022 (0.020)	Loss 0.9777 (0.1683)	
Epoch: [0][6560/27046]	Time 0.022 (0.020)	Loss 0.3569 (0.1682)	
Epoch: [0][6570/27046]	Time 0.021 (0.020)	Loss 0.0741 (0.1682)	
Epoch: [0][6580/27046]	Time 0.024 (0.020)	Loss 0.0077 (0.1682)	
Epoch: [0][6590/27046]	Time 0.021 (0.020)	Loss 0.1123 (0.1681)	
Epoch: [0][6600/27046]	Time 0.021 (0.020)	Loss 0.1487 (0.1680)	
Epoch: [0][6610/27046]	Time 0.021 (0.020)	Loss 0.0252 (0.1680)	
Epoch: [0][6620/27046]	Time 0.022 (0.020)	Loss 0.2688 (0.1679)	
Epoch: [0][6630/27046]	Time 0.022 (0.020

Epoch: [0][7770/27046]	Time 0.025 (0.020)	Loss 0.0796 (0.1647)	
Epoch: [0][7780/27046]	Time 0.021 (0.020)	Loss 0.0050 (0.1646)	
Epoch: [0][7790/27046]	Time 0.020 (0.020)	Loss 0.0085 (0.1645)	
Epoch: [0][7800/27046]	Time 0.020 (0.020)	Loss 0.0227 (0.1644)	
Epoch: [0][7810/27046]	Time 0.021 (0.020)	Loss 0.2395 (0.1643)	
Epoch: [0][7820/27046]	Time 0.020 (0.020)	Loss 0.0467 (0.1643)	
Epoch: [0][7830/27046]	Time 0.021 (0.020)	Loss 0.0172 (0.1642)	
Epoch: [0][7840/27046]	Time 0.020 (0.020)	Loss 0.1863 (0.1643)	
Epoch: [0][7850/27046]	Time 0.021 (0.020)	Loss 0.0974 (0.1642)	
Epoch: [0][7860/27046]	Time 0.019 (0.020)	Loss 0.0174 (0.1641)	
Epoch: [0][7870/27046]	Time 0.020 (0.020)	Loss 0.2294 (0.1640)	
Epoch: [0][7880/27046]	Time 0.020 (0.020)	Loss 0.0513 (0.1640)	
Epoch: [0][7890/27046]	Time 0.024 (0.020)	Loss 0.0160 (0.1639)	
Epoch: [0][7900/27046]	Time 0.020 (0.020)	Loss 0.0197 (0.1639)	
Epoch: [0][7910/27046]	Time 0.020 (0.020)	Loss 0.0034 (0.1638)	
Epoch: [0][7920/27046]	Time 0.021 (0.020

Epoch: [0][9060/27046]	Time 0.020 (0.020)	Loss 0.1105 (0.1631)	
Epoch: [0][9070/27046]	Time 0.020 (0.020)	Loss 0.0812 (0.1632)	
Epoch: [0][9080/27046]	Time 0.023 (0.020)	Loss 0.1889 (0.1631)	
Epoch: [0][9090/27046]	Time 0.020 (0.020)	Loss 0.0344 (0.1631)	
Epoch: [0][9100/27046]	Time 0.019 (0.020)	Loss 0.0539 (0.1631)	
Epoch: [0][9110/27046]	Time 0.019 (0.020)	Loss 0.1339 (0.1630)	
Epoch: [0][9120/27046]	Time 0.018 (0.020)	Loss 0.0057 (0.1630)	
Epoch: [0][9130/27046]	Time 0.019 (0.020)	Loss 0.2627 (0.1630)	
Epoch: [0][9140/27046]	Time 0.020 (0.020)	Loss 0.4659 (0.1631)	
Epoch: [0][9150/27046]	Time 0.019 (0.020)	Loss 0.1246 (0.1632)	
Epoch: [0][9160/27046]	Time 0.020 (0.020)	Loss 0.1776 (0.1632)	
Epoch: [0][9170/27046]	Time 0.019 (0.020)	Loss 0.0052 (0.1632)	
Epoch: [0][9180/27046]	Time 0.020 (0.020)	Loss 0.0252 (0.1633)	
Epoch: [0][9190/27046]	Time 0.021 (0.020)	Loss 0.0343 (0.1634)	
Epoch: [0][9200/27046]	Time 0.021 (0.020)	Loss 0.0369 (0.1636)	
Epoch: [0][9210/27046]	Time 0.019 (0.020

Epoch: [0][10340/27046]	Time 0.019 (0.020)	Loss 0.0024 (0.1625)	
Epoch: [0][10350/27046]	Time 0.021 (0.020)	Loss 0.0036 (0.1624)	
Epoch: [0][10360/27046]	Time 0.020 (0.020)	Loss 1.1129 (0.1625)	
Epoch: [0][10370/27046]	Time 0.021 (0.020)	Loss 0.0240 (0.1625)	
Epoch: [0][10380/27046]	Time 0.020 (0.020)	Loss 0.0367 (0.1626)	
Epoch: [0][10390/27046]	Time 0.020 (0.020)	Loss 0.0068 (0.1625)	
Epoch: [0][10400/27046]	Time 0.020 (0.020)	Loss 0.0090 (0.1624)	
Epoch: [0][10410/27046]	Time 0.021 (0.020)	Loss 0.3205 (0.1623)	
Epoch: [0][10420/27046]	Time 0.019 (0.020)	Loss 0.0144 (0.1623)	
Epoch: [0][10430/27046]	Time 0.019 (0.020)	Loss 0.2513 (0.1622)	
Epoch: [0][10440/27046]	Time 0.021 (0.020)	Loss 0.0190 (0.1622)	
Epoch: [0][10450/27046]	Time 0.019 (0.020)	Loss 0.1903 (0.1622)	
Epoch: [0][10460/27046]	Time 0.020 (0.020)	Loss 0.1111 (0.1622)	
Epoch: [0][10470/27046]	Time 0.019 (0.020)	Loss 0.0730 (0.1621)	
Epoch: [0][10480/27046]	Time 0.020 (0.020)	Loss 0.1244 (0.1622)	
Epoch: [0][10490/27046]	T

Epoch: [0][11620/27046]	Time 0.020 (0.020)	Loss 0.0253 (0.1602)	
Epoch: [0][11630/27046]	Time 0.021 (0.020)	Loss 0.0018 (0.1602)	
Epoch: [0][11640/27046]	Time 0.020 (0.020)	Loss 0.0216 (0.1602)	
Epoch: [0][11650/27046]	Time 0.020 (0.020)	Loss 0.5046 (0.1605)	
Epoch: [0][11660/27046]	Time 0.019 (0.020)	Loss 0.0639 (0.1605)	
Epoch: [0][11670/27046]	Time 0.023 (0.020)	Loss 0.0897 (0.1605)	
Epoch: [0][11680/27046]	Time 0.020 (0.020)	Loss 0.1097 (0.1605)	
Epoch: [0][11690/27046]	Time 0.021 (0.020)	Loss 0.1315 (0.1605)	
Epoch: [0][11700/27046]	Time 0.020 (0.020)	Loss 0.2240 (0.1604)	
Epoch: [0][11710/27046]	Time 0.021 (0.020)	Loss 0.0163 (0.1604)	
Epoch: [0][11720/27046]	Time 0.020 (0.020)	Loss 0.2376 (0.1604)	
Epoch: [0][11730/27046]	Time 0.019 (0.020)	Loss 0.1246 (0.1603)	
Epoch: [0][11740/27046]	Time 0.023 (0.020)	Loss 0.1275 (0.1603)	
Epoch: [0][11750/27046]	Time 0.021 (0.020)	Loss 0.3202 (0.1602)	
Epoch: [0][11760/27046]	Time 0.020 (0.020)	Loss 0.1238 (0.1602)	
Epoch: [0][11770/27046]	T

Epoch: [0][12890/27046]	Time 0.020 (0.020)	Loss 0.0385 (0.1600)	
Epoch: [0][12900/27046]	Time 0.019 (0.020)	Loss 0.0973 (0.1600)	
Epoch: [0][12910/27046]	Time 0.020 (0.020)	Loss 0.0694 (0.1600)	
Epoch: [0][12920/27046]	Time 0.019 (0.020)	Loss 0.0079 (0.1601)	
Epoch: [0][12930/27046]	Time 0.020 (0.020)	Loss 0.1761 (0.1600)	
Epoch: [0][12940/27046]	Time 0.019 (0.020)	Loss 0.0065 (0.1600)	
Epoch: [0][12950/27046]	Time 0.020 (0.020)	Loss 0.0093 (0.1599)	
Epoch: [0][12960/27046]	Time 0.021 (0.020)	Loss 0.0172 (0.1598)	
Epoch: [0][12970/27046]	Time 0.021 (0.020)	Loss 0.4502 (0.1598)	
Epoch: [0][12980/27046]	Time 0.019 (0.020)	Loss 0.0434 (0.1598)	
Epoch: [0][12990/27046]	Time 0.020 (0.020)	Loss 0.1070 (0.1597)	
Epoch: [0][13000/27046]	Time 0.019 (0.020)	Loss 0.0422 (0.1596)	
Epoch: [0][13010/27046]	Time 0.019 (0.020)	Loss 0.1138 (0.1596)	
Epoch: [0][13020/27046]	Time 0.019 (0.020)	Loss 0.0180 (0.1595)	
Epoch: [0][13030/27046]	Time 0.019 (0.020)	Loss 0.3034 (0.1595)	
Epoch: [0][13040/27046]	T

Epoch: [0][14160/27046]	Time 0.025 (0.020)	Loss 0.3955 (0.1585)	
Epoch: [0][14170/27046]	Time 0.021 (0.020)	Loss 0.0078 (0.1585)	
Epoch: [0][14180/27046]	Time 0.019 (0.020)	Loss 0.0350 (0.1585)	
Epoch: [0][14190/27046]	Time 0.019 (0.020)	Loss 0.0209 (0.1585)	
Epoch: [0][14200/27046]	Time 0.020 (0.020)	Loss 0.0019 (0.1586)	
Epoch: [0][14210/27046]	Time 0.025 (0.020)	Loss 0.0372 (0.1585)	
Epoch: [0][14220/27046]	Time 0.020 (0.020)	Loss 0.1120 (0.1585)	
Epoch: [0][14230/27046]	Time 0.022 (0.020)	Loss 1.0022 (0.1586)	
Epoch: [0][14240/27046]	Time 0.024 (0.020)	Loss 0.0471 (0.1586)	
Epoch: [0][14250/27046]	Time 0.022 (0.020)	Loss 0.0864 (0.1586)	
Epoch: [0][14260/27046]	Time 0.021 (0.020)	Loss 0.0359 (0.1586)	
Epoch: [0][14270/27046]	Time 0.020 (0.020)	Loss 0.1020 (0.1586)	
Epoch: [0][14280/27046]	Time 0.022 (0.020)	Loss 0.0884 (0.1586)	
Epoch: [0][14290/27046]	Time 0.020 (0.020)	Loss 1.0091 (0.1586)	
Epoch: [0][14300/27046]	Time 0.021 (0.020)	Loss 0.0320 (0.1586)	
Epoch: [0][14310/27046]	T

Epoch: [0][15430/27046]	Time 0.019 (0.020)	Loss 0.0606 (0.1577)	
Epoch: [0][15440/27046]	Time 0.020 (0.020)	Loss 0.0683 (0.1576)	
Epoch: [0][15450/27046]	Time 0.019 (0.020)	Loss 0.1086 (0.1576)	
Epoch: [0][15460/27046]	Time 0.021 (0.020)	Loss 0.3557 (0.1576)	
Epoch: [0][15470/27046]	Time 0.020 (0.020)	Loss 0.0739 (0.1576)	
Epoch: [0][15480/27046]	Time 0.019 (0.020)	Loss 0.2931 (0.1576)	
Epoch: [0][15490/27046]	Time 0.021 (0.020)	Loss 0.0288 (0.1576)	
Epoch: [0][15500/27046]	Time 0.021 (0.020)	Loss 0.0003 (0.1577)	
Epoch: [0][15510/27046]	Time 0.020 (0.020)	Loss 0.0020 (0.1576)	
Epoch: [0][15520/27046]	Time 0.020 (0.020)	Loss 0.1968 (0.1576)	
Epoch: [0][15530/27046]	Time 0.020 (0.020)	Loss 0.0111 (0.1576)	
Epoch: [0][15540/27046]	Time 0.020 (0.020)	Loss 0.0337 (0.1576)	
Epoch: [0][15550/27046]	Time 0.020 (0.020)	Loss 0.0190 (0.1575)	
Epoch: [0][15560/27046]	Time 0.019 (0.020)	Loss 0.1325 (0.1575)	
Epoch: [0][15570/27046]	Time 0.020 (0.020)	Loss 0.0400 (0.1575)	
Epoch: [0][15580/27046]	T

Epoch: [0][16710/27046]	Time 0.021 (0.020)	Loss 0.0187 (0.1582)	
Epoch: [0][16720/27046]	Time 0.020 (0.020)	Loss 0.1375 (0.1582)	
Epoch: [0][16730/27046]	Time 0.020 (0.020)	Loss 0.0362 (0.1582)	
Epoch: [0][16740/27046]	Time 0.022 (0.020)	Loss 0.1028 (0.1582)	
Epoch: [0][16750/27046]	Time 0.020 (0.020)	Loss 0.2299 (0.1582)	
Epoch: [0][16760/27046]	Time 0.020 (0.020)	Loss 0.6068 (0.1583)	
Epoch: [0][16770/27046]	Time 0.020 (0.020)	Loss 0.9161 (0.1584)	
Epoch: [0][16780/27046]	Time 0.020 (0.020)	Loss 0.0227 (0.1583)	
Epoch: [0][16790/27046]	Time 0.020 (0.020)	Loss 0.0716 (0.1584)	
Epoch: [0][16800/27046]	Time 0.023 (0.020)	Loss 0.6795 (0.1584)	
Epoch: [0][16810/27046]	Time 0.020 (0.020)	Loss 0.3852 (0.1585)	
Epoch: [0][16820/27046]	Time 0.020 (0.020)	Loss 0.4017 (0.1585)	
Epoch: [0][16830/27046]	Time 0.022 (0.020)	Loss 0.0457 (0.1584)	
Epoch: [0][16840/27046]	Time 0.020 (0.020)	Loss 0.0450 (0.1585)	
Epoch: [0][16850/27046]	Time 0.020 (0.020)	Loss 0.0417 (0.1585)	
Epoch: [0][16860/27046]	T

Epoch: [0][17980/27046]	Time 0.019 (0.020)	Loss 0.0682 (0.1574)	
Epoch: [0][17990/27046]	Time 0.020 (0.020)	Loss 0.1337 (0.1573)	
Epoch: [0][18000/27046]	Time 0.019 (0.020)	Loss 0.0266 (0.1574)	
Epoch: [0][18010/27046]	Time 0.015 (0.020)	Loss 1.4069 (0.1574)	
Epoch: [0][18020/27046]	Time 0.019 (0.020)	Loss 0.0494 (0.1574)	
Epoch: [0][18030/27046]	Time 0.019 (0.020)	Loss 0.0467 (0.1573)	
Epoch: [0][18040/27046]	Time 0.020 (0.020)	Loss 0.1943 (0.1573)	
Epoch: [0][18050/27046]	Time 0.020 (0.020)	Loss 0.0408 (0.1573)	
Epoch: [0][18060/27046]	Time 0.019 (0.020)	Loss 0.0883 (0.1572)	
Epoch: [0][18070/27046]	Time 0.021 (0.020)	Loss 0.1985 (0.1572)	
Epoch: [0][18080/27046]	Time 0.022 (0.020)	Loss 0.0017 (0.1572)	
Epoch: [0][18090/27046]	Time 0.020 (0.020)	Loss 0.2461 (0.1572)	
Epoch: [0][18100/27046]	Time 0.020 (0.020)	Loss 0.0127 (0.1572)	
Epoch: [0][18110/27046]	Time 0.019 (0.020)	Loss 0.0049 (0.1572)	
Epoch: [0][18120/27046]	Time 0.020 (0.020)	Loss 0.1078 (0.1572)	
Epoch: [0][18130/27046]	T

Epoch: [0][19250/27046]	Time 0.019 (0.020)	Loss 0.0049 (0.1569)	
Epoch: [0][19260/27046]	Time 0.021 (0.020)	Loss 0.3056 (0.1570)	
Epoch: [0][19270/27046]	Time 0.021 (0.020)	Loss 0.0100 (0.1570)	
Epoch: [0][19280/27046]	Time 0.019 (0.020)	Loss 0.0302 (0.1569)	
Epoch: [0][19290/27046]	Time 0.019 (0.020)	Loss 0.2205 (0.1569)	
Epoch: [0][19300/27046]	Time 0.019 (0.020)	Loss 0.1909 (0.1569)	
Epoch: [0][19310/27046]	Time 0.019 (0.020)	Loss 0.2417 (0.1569)	
Epoch: [0][19320/27046]	Time 0.021 (0.020)	Loss 0.0690 (0.1569)	
Epoch: [0][19330/27046]	Time 0.019 (0.020)	Loss 0.1042 (0.1568)	
Epoch: [0][19340/27046]	Time 0.021 (0.020)	Loss 0.0352 (0.1569)	
Epoch: [0][19350/27046]	Time 0.020 (0.020)	Loss 0.0760 (0.1569)	
Epoch: [0][19360/27046]	Time 0.020 (0.020)	Loss 0.0200 (0.1569)	
Epoch: [0][19370/27046]	Time 0.021 (0.020)	Loss 0.1031 (0.1568)	
Epoch: [0][19380/27046]	Time 0.020 (0.020)	Loss 0.0291 (0.1568)	
Epoch: [0][19390/27046]	Time 0.020 (0.020)	Loss 0.0134 (0.1568)	
Epoch: [0][19400/27046]	T

Epoch: [0][20520/27046]	Time 0.023 (0.020)	Loss 0.1120 (0.1566)	
Epoch: [0][20530/27046]	Time 0.021 (0.020)	Loss 0.3843 (0.1566)	
Epoch: [0][20540/27046]	Time 0.022 (0.020)	Loss 0.2493 (0.1566)	
Epoch: [0][20550/27046]	Time 0.023 (0.020)	Loss 0.0478 (0.1567)	
Epoch: [0][20560/27046]	Time 0.024 (0.020)	Loss 0.0076 (0.1567)	
Epoch: [0][20570/27046]	Time 0.022 (0.020)	Loss 0.0516 (0.1567)	
Epoch: [0][20580/27046]	Time 0.021 (0.020)	Loss 0.0262 (0.1567)	
Epoch: [0][20590/27046]	Time 0.021 (0.020)	Loss 1.4055 (0.1568)	
Epoch: [0][20600/27046]	Time 0.021 (0.020)	Loss 0.0932 (0.1568)	
Epoch: [0][20610/27046]	Time 0.030 (0.020)	Loss 0.0104 (0.1567)	
Epoch: [0][20620/27046]	Time 0.021 (0.020)	Loss 0.0125 (0.1567)	
Epoch: [0][20630/27046]	Time 0.025 (0.020)	Loss 0.0746 (0.1567)	
Epoch: [0][20640/27046]	Time 0.022 (0.020)	Loss 0.0074 (0.1567)	
Epoch: [0][20650/27046]	Time 0.021 (0.020)	Loss 0.4525 (0.1567)	
Epoch: [0][20660/27046]	Time 0.022 (0.020)	Loss 0.1659 (0.1567)	
Epoch: [0][20670/27046]	T

Epoch: [0][21790/27046]	Time 0.026 (0.020)	Loss 0.0092 (0.1569)	
Epoch: [0][21800/27046]	Time 0.019 (0.020)	Loss 0.6386 (0.1570)	
Epoch: [0][21810/27046]	Time 0.019 (0.020)	Loss 0.2076 (0.1569)	
Epoch: [0][21820/27046]	Time 0.019 (0.020)	Loss 0.0167 (0.1569)	
Epoch: [0][21830/27046]	Time 0.020 (0.020)	Loss 0.0326 (0.1569)	
Epoch: [0][21840/27046]	Time 0.020 (0.020)	Loss 0.0526 (0.1569)	
Epoch: [0][21850/27046]	Time 0.020 (0.020)	Loss 0.2006 (0.1569)	
Epoch: [0][21860/27046]	Time 0.019 (0.020)	Loss 0.1175 (0.1569)	
Epoch: [0][21870/27046]	Time 0.019 (0.020)	Loss 0.6410 (0.1569)	
Epoch: [0][21880/27046]	Time 0.020 (0.020)	Loss 0.0868 (0.1569)	
Epoch: [0][21890/27046]	Time 0.020 (0.020)	Loss 0.1467 (0.1569)	
Epoch: [0][21900/27046]	Time 0.020 (0.020)	Loss 0.0409 (0.1568)	
Epoch: [0][21910/27046]	Time 0.019 (0.020)	Loss 0.3932 (0.1568)	
Epoch: [0][21920/27046]	Time 0.019 (0.020)	Loss 0.3848 (0.1568)	
Epoch: [0][21930/27046]	Time 0.019 (0.020)	Loss 0.0248 (0.1568)	
Epoch: [0][21940/27046]	T

Epoch: [0][23060/27046]	Time 0.020 (0.020)	Loss 0.0174 (0.1570)	
Epoch: [0][23070/27046]	Time 0.022 (0.020)	Loss 0.0431 (0.1569)	
Epoch: [0][23080/27046]	Time 0.020 (0.020)	Loss 0.0203 (0.1569)	
Epoch: [0][23090/27046]	Time 0.022 (0.020)	Loss 0.0018 (0.1569)	
Epoch: [0][23100/27046]	Time 0.021 (0.020)	Loss 0.1211 (0.1569)	
Epoch: [0][23110/27046]	Time 0.021 (0.020)	Loss 1.0886 (0.1570)	
Epoch: [0][23120/27046]	Time 0.021 (0.020)	Loss 0.0514 (0.1571)	
Epoch: [0][23130/27046]	Time 0.019 (0.020)	Loss 0.0003 (0.1571)	
Epoch: [0][23140/27046]	Time 0.022 (0.020)	Loss 0.3979 (0.1571)	
Epoch: [0][23150/27046]	Time 0.021 (0.020)	Loss 0.0300 (0.1570)	
Epoch: [0][23160/27046]	Time 0.019 (0.020)	Loss 0.0897 (0.1571)	
Epoch: [0][23170/27046]	Time 0.023 (0.020)	Loss 0.0303 (0.1571)	
Epoch: [0][23180/27046]	Time 0.020 (0.020)	Loss 0.0175 (0.1571)	
Epoch: [0][23190/27046]	Time 0.021 (0.020)	Loss 0.5198 (0.1572)	
Epoch: [0][23200/27046]	Time 0.022 (0.020)	Loss 0.2165 (0.1571)	
Epoch: [0][23210/27046]	T

Epoch: [0][24340/27046]	Time 0.020 (0.020)	Loss 0.0323 (0.1572)	
Epoch: [0][24350/27046]	Time 0.021 (0.020)	Loss 0.1090 (0.1571)	
Epoch: [0][24360/27046]	Time 0.023 (0.020)	Loss 0.4940 (0.1572)	
Epoch: [0][24370/27046]	Time 0.019 (0.020)	Loss 0.0283 (0.1571)	
Epoch: [0][24380/27046]	Time 0.019 (0.020)	Loss 0.0619 (0.1571)	
Epoch: [0][24390/27046]	Time 0.020 (0.020)	Loss 0.0224 (0.1571)	
Epoch: [0][24400/27046]	Time 0.021 (0.020)	Loss 0.3212 (0.1571)	
Epoch: [0][24410/27046]	Time 0.023 (0.020)	Loss 0.0093 (0.1571)	
Epoch: [0][24420/27046]	Time 0.020 (0.020)	Loss 0.2008 (0.1571)	
Epoch: [0][24430/27046]	Time 0.020 (0.020)	Loss 0.2037 (0.1571)	
Epoch: [0][24440/27046]	Time 0.020 (0.020)	Loss 0.0353 (0.1570)	
Epoch: [0][24450/27046]	Time 0.022 (0.020)	Loss 0.1856 (0.1570)	
Epoch: [0][24460/27046]	Time 0.022 (0.020)	Loss 0.8380 (0.1571)	
Epoch: [0][24470/27046]	Time 0.022 (0.020)	Loss 0.0402 (0.1571)	
Epoch: [0][24480/27046]	Time 0.020 (0.020)	Loss 0.0980 (0.1571)	
Epoch: [0][24490/27046]	T

Epoch: [0][25610/27046]	Time 0.020 (0.020)	Loss 0.4426 (0.1569)	
Epoch: [0][25620/27046]	Time 0.021 (0.020)	Loss 0.0080 (0.1569)	
Epoch: [0][25630/27046]	Time 0.020 (0.020)	Loss 0.2370 (0.1568)	
Epoch: [0][25640/27046]	Time 0.021 (0.020)	Loss 0.2517 (0.1568)	
Epoch: [0][25650/27046]	Time 0.023 (0.020)	Loss 0.1797 (0.1568)	
Epoch: [0][25660/27046]	Time 0.022 (0.020)	Loss 0.2071 (0.1568)	
Epoch: [0][25670/27046]	Time 0.020 (0.020)	Loss 0.0464 (0.1568)	
Epoch: [0][25680/27046]	Time 0.021 (0.020)	Loss 0.0287 (0.1568)	
Epoch: [0][25690/27046]	Time 0.022 (0.020)	Loss 0.0261 (0.1568)	
Epoch: [0][25700/27046]	Time 0.021 (0.020)	Loss 0.0352 (0.1567)	
Epoch: [0][25710/27046]	Time 0.020 (0.020)	Loss 0.0068 (0.1567)	
Epoch: [0][25720/27046]	Time 0.020 (0.020)	Loss 0.2228 (0.1568)	
Epoch: [0][25730/27046]	Time 0.020 (0.020)	Loss 0.2844 (0.1568)	
Epoch: [0][25740/27046]	Time 0.020 (0.020)	Loss 0.2645 (0.1568)	
Epoch: [0][25750/27046]	Time 0.021 (0.020)	Loss 0.0071 (0.1568)	
Epoch: [0][25760/27046]	T

Epoch: [0][26890/27046]	Time 0.019 (0.020)	Loss 0.4767 (0.1564)	
Epoch: [0][26900/27046]	Time 0.020 (0.020)	Loss 0.0409 (0.1564)	
Epoch: [0][26910/27046]	Time 0.019 (0.020)	Loss 0.0145 (0.1564)	
Epoch: [0][26920/27046]	Time 0.019 (0.020)	Loss 0.4018 (0.1564)	
Epoch: [0][26930/27046]	Time 0.019 (0.020)	Loss 0.2477 (0.1564)	
Epoch: [0][26940/27046]	Time 0.019 (0.020)	Loss 0.0048 (0.1564)	
Epoch: [0][26950/27046]	Time 0.021 (0.020)	Loss 0.0865 (0.1564)	
Epoch: [0][26960/27046]	Time 0.023 (0.020)	Loss 0.0153 (0.1564)	
Epoch: [0][26970/27046]	Time 0.021 (0.020)	Loss 0.0097 (0.1564)	
Epoch: [0][26980/27046]	Time 0.020 (0.020)	Loss 0.0827 (0.1564)	
Epoch: [0][26990/27046]	Time 0.019 (0.020)	Loss 0.0050 (0.1564)	
Epoch: [0][27000/27046]	Time 0.019 (0.020)	Loss 0.1679 (0.1564)	
Epoch: [0][27010/27046]	Time 0.020 (0.020)	Loss 0.0862 (0.1564)	
Epoch: [0][27020/27046]	Time 0.020 (0.020)	Loss 0.0278 (0.1564)	
Epoch: [0][27030/27046]	Time 0.020 (0.020)	Loss 0.0070 (0.1564)	
Epoch: [0][27040/27046]	T

Epoch: [0][1740/6762]	Time 0.003 (0.004)	
Epoch: [0][1750/6762]	Time 0.004 (0.004)	
Epoch: [0][1760/6762]	Time 0.004 (0.004)	
Epoch: [0][1770/6762]	Time 0.003 (0.004)	
Epoch: [0][1780/6762]	Time 0.006 (0.004)	
Epoch: [0][1790/6762]	Time 0.004 (0.004)	
Epoch: [0][1800/6762]	Time 0.004 (0.004)	
Epoch: [0][1810/6762]	Time 0.003 (0.004)	
Epoch: [0][1820/6762]	Time 0.004 (0.004)	
Epoch: [0][1830/6762]	Time 0.003 (0.004)	
Epoch: [0][1840/6762]	Time 0.004 (0.004)	
Epoch: [0][1850/6762]	Time 0.004 (0.004)	
Epoch: [0][1860/6762]	Time 0.003 (0.004)	
Epoch: [0][1870/6762]	Time 0.004 (0.004)	
Epoch: [0][1880/6762]	Time 0.004 (0.004)	
Epoch: [0][1890/6762]	Time 0.005 (0.004)	
Epoch: [0][1900/6762]	Time 0.004 (0.004)	
Epoch: [0][1910/6762]	Time 0.004 (0.004)	
Epoch: [0][1920/6762]	Time 0.003 (0.004)	
Epoch: [0][1930/6762]	Time 0.003 (0.004)	
Epoch: [0][1940/6762]	Time 0.004 (0.004)	
Epoch: [0][1950/6762]	Time 0.003 (0.004)	
Epoch: [0][1960/6762]	Time 0.003 (0.004)	
Epoch: [0][1970/6762]	Time 0.003 (

Epoch: [0][3720/6762]	Time 0.004 (0.004)	
Epoch: [0][3730/6762]	Time 0.004 (0.004)	
Epoch: [0][3740/6762]	Time 0.004 (0.004)	
Epoch: [0][3750/6762]	Time 0.003 (0.004)	
Epoch: [0][3760/6762]	Time 0.004 (0.004)	
Epoch: [0][3770/6762]	Time 0.004 (0.004)	
Epoch: [0][3780/6762]	Time 0.003 (0.004)	
Epoch: [0][3790/6762]	Time 0.004 (0.004)	
Epoch: [0][3800/6762]	Time 0.004 (0.004)	
Epoch: [0][3810/6762]	Time 0.003 (0.004)	
Epoch: [0][3820/6762]	Time 0.004 (0.004)	
Epoch: [0][3830/6762]	Time 0.004 (0.004)	
Epoch: [0][3840/6762]	Time 0.005 (0.004)	
Epoch: [0][3850/6762]	Time 0.004 (0.004)	
Epoch: [0][3860/6762]	Time 0.004 (0.004)	
Epoch: [0][3870/6762]	Time 0.004 (0.004)	
Epoch: [0][3880/6762]	Time 0.004 (0.004)	
Epoch: [0][3890/6762]	Time 0.004 (0.004)	
Epoch: [0][3900/6762]	Time 0.004 (0.004)	
Epoch: [0][3910/6762]	Time 0.004 (0.004)	
Epoch: [0][3920/6762]	Time 0.004 (0.004)	
Epoch: [0][3930/6762]	Time 0.003 (0.004)	
Epoch: [0][3940/6762]	Time 0.004 (0.004)	
Epoch: [0][3950/6762]	Time 0.004 (

Epoch: [0][5720/6762]	Time 0.004 (0.004)	
Epoch: [0][5730/6762]	Time 0.003 (0.004)	
Epoch: [0][5740/6762]	Time 0.004 (0.004)	
Epoch: [0][5750/6762]	Time 0.003 (0.004)	
Epoch: [0][5760/6762]	Time 0.006 (0.004)	
Epoch: [0][5770/6762]	Time 0.003 (0.004)	
Epoch: [0][5780/6762]	Time 0.003 (0.004)	
Epoch: [0][5790/6762]	Time 0.003 (0.004)	
Epoch: [0][5800/6762]	Time 0.004 (0.004)	
Epoch: [0][5810/6762]	Time 0.003 (0.004)	
Epoch: [0][5820/6762]	Time 0.004 (0.004)	
Epoch: [0][5830/6762]	Time 0.004 (0.004)	
Epoch: [0][5840/6762]	Time 0.004 (0.004)	
Epoch: [0][5850/6762]	Time 0.004 (0.004)	
Epoch: [0][5860/6762]	Time 0.003 (0.004)	
Epoch: [0][5870/6762]	Time 0.004 (0.004)	
Epoch: [0][5880/6762]	Time 0.003 (0.004)	
Epoch: [0][5890/6762]	Time 0.004 (0.004)	
Epoch: [0][5900/6762]	Time 0.004 (0.004)	
Epoch: [0][5910/6762]	Time 0.003 (0.004)	
Epoch: [0][5920/6762]	Time 0.004 (0.004)	
Epoch: [0][5930/6762]	Time 0.004 (0.004)	
Epoch: [0][5940/6762]	Time 0.004 (0.004)	
Epoch: [0][5950/6762]	Time 0.004 (

Epoch: [1][610/27046]	Time 0.018 (0.021)	Loss 0.0216 (0.1463)	
Epoch: [1][620/27046]	Time 0.019 (0.021)	Loss 0.1544 (0.1451)	
Epoch: [1][630/27046]	Time 0.020 (0.021)	Loss 0.0000 (0.1452)	
Epoch: [1][640/27046]	Time 0.020 (0.021)	Loss 0.0227 (0.1463)	
Epoch: [1][650/27046]	Time 0.020 (0.021)	Loss 0.0825 (0.1460)	
Epoch: [1][660/27046]	Time 0.019 (0.021)	Loss 0.0042 (0.1467)	
Epoch: [1][670/27046]	Time 0.019 (0.021)	Loss 0.2417 (0.1462)	
Epoch: [1][680/27046]	Time 0.019 (0.021)	Loss 0.1192 (0.1478)	
Epoch: [1][690/27046]	Time 0.019 (0.021)	Loss 0.2419 (0.1480)	
Epoch: [1][700/27046]	Time 0.022 (0.021)	Loss 0.0456 (0.1484)	
Epoch: [1][710/27046]	Time 0.018 (0.021)	Loss 0.0581 (0.1473)	
Epoch: [1][720/27046]	Time 0.020 (0.021)	Loss 0.3829 (0.1474)	
Epoch: [1][730/27046]	Time 0.021 (0.021)	Loss 0.0216 (0.1478)	
Epoch: [1][740/27046]	Time 0.021 (0.021)	Loss 0.1103 (0.1479)	
Epoch: [1][750/27046]	Time 0.019 (0.021)	Loss 0.0182 (0.1469)	
Epoch: [1][760/27046]	Time 0.020 (0.021)	Loss 0.6600 (0

Epoch: [1][1900/27046]	Time 0.020 (0.020)	Loss 0.0678 (0.1524)	
Epoch: [1][1910/27046]	Time 0.020 (0.020)	Loss 0.0923 (0.1524)	
Epoch: [1][1920/27046]	Time 0.020 (0.020)	Loss 0.0374 (0.1523)	
Epoch: [1][1930/27046]	Time 0.019 (0.020)	Loss 0.3468 (0.1520)	
Epoch: [1][1940/27046]	Time 0.019 (0.020)	Loss 0.0321 (0.1518)	
Epoch: [1][1950/27046]	Time 0.018 (0.020)	Loss 0.2187 (0.1518)	
Epoch: [1][1960/27046]	Time 0.020 (0.020)	Loss 0.1004 (0.1522)	
Epoch: [1][1970/27046]	Time 0.019 (0.020)	Loss 0.0288 (0.1518)	
Epoch: [1][1980/27046]	Time 0.020 (0.020)	Loss 0.2592 (0.1520)	
Epoch: [1][1990/27046]	Time 0.020 (0.020)	Loss 0.0528 (0.1517)	
Epoch: [1][2000/27046]	Time 0.020 (0.020)	Loss 0.0100 (0.1526)	
Epoch: [1][2010/27046]	Time 0.020 (0.020)	Loss 0.0504 (0.1530)	
Epoch: [1][2020/27046]	Time 0.019 (0.020)	Loss 0.1314 (0.1531)	
Epoch: [1][2030/27046]	Time 0.019 (0.020)	Loss 0.1387 (0.1537)	
Epoch: [1][2040/27046]	Time 0.021 (0.020)	Loss 0.0803 (0.1532)	
Epoch: [1][2050/27046]	Time 0.021 (0.020

Epoch: [1][3190/27046]	Time 0.020 (0.020)	Loss 0.2875 (0.1571)	
Epoch: [1][3200/27046]	Time 0.020 (0.020)	Loss 0.0660 (0.1571)	
Epoch: [1][3210/27046]	Time 0.019 (0.020)	Loss 0.0027 (0.1572)	
Epoch: [1][3220/27046]	Time 0.020 (0.020)	Loss 0.0055 (0.1575)	
Epoch: [1][3230/27046]	Time 0.019 (0.020)	Loss 0.3002 (0.1575)	
Epoch: [1][3240/27046]	Time 0.020 (0.020)	Loss 0.0048 (0.1573)	
Epoch: [1][3250/27046]	Time 0.019 (0.020)	Loss 0.0119 (0.1574)	
Epoch: [1][3260/27046]	Time 0.020 (0.020)	Loss 0.1817 (0.1572)	
Epoch: [1][3270/27046]	Time 0.021 (0.020)	Loss 0.1132 (0.1569)	
Epoch: [1][3280/27046]	Time 0.022 (0.020)	Loss 0.1130 (0.1569)	
Epoch: [1][3290/27046]	Time 0.022 (0.020)	Loss 0.1173 (0.1571)	
Epoch: [1][3300/27046]	Time 0.021 (0.020)	Loss 0.1175 (0.1569)	
Epoch: [1][3310/27046]	Time 0.020 (0.020)	Loss 0.0385 (0.1566)	
Epoch: [1][3320/27046]	Time 0.019 (0.020)	Loss 0.1014 (0.1565)	
Epoch: [1][3330/27046]	Time 0.019 (0.020)	Loss 0.4487 (0.1566)	
Epoch: [1][3340/27046]	Time 0.020 (0.020

Epoch: [1][4490/27046]	Time 0.020 (0.020)	Loss 0.0357 (0.1579)	
Epoch: [1][4500/27046]	Time 0.020 (0.020)	Loss 0.1922 (0.1580)	
Epoch: [1][4510/27046]	Time 0.020 (0.020)	Loss 0.0057 (0.1581)	
Epoch: [1][4520/27046]	Time 0.020 (0.020)	Loss 0.0424 (0.1580)	
Epoch: [1][4530/27046]	Time 0.019 (0.020)	Loss 0.0140 (0.1579)	
Epoch: [1][4540/27046]	Time 0.020 (0.020)	Loss 0.2475 (0.1579)	
Epoch: [1][4550/27046]	Time 0.020 (0.020)	Loss 0.0681 (0.1579)	
Epoch: [1][4560/27046]	Time 0.021 (0.020)	Loss 0.0124 (0.1577)	
Epoch: [1][4570/27046]	Time 0.019 (0.020)	Loss 0.1024 (0.1576)	
Epoch: [1][4580/27046]	Time 0.019 (0.020)	Loss 0.0215 (0.1576)	
Epoch: [1][4590/27046]	Time 0.018 (0.020)	Loss 0.2363 (0.1575)	
Epoch: [1][4600/27046]	Time 0.019 (0.020)	Loss 0.1926 (0.1573)	
Epoch: [1][4610/27046]	Time 0.020 (0.020)	Loss 0.3862 (0.1575)	
Epoch: [1][4620/27046]	Time 0.020 (0.020)	Loss 0.0602 (0.1574)	
Epoch: [1][4630/27046]	Time 0.020 (0.020)	Loss 0.2405 (0.1573)	
Epoch: [1][4640/27046]	Time 0.019 (0.020

Epoch: [1][5790/27046]	Time 0.020 (0.020)	Loss 0.0060 (0.1553)	
Epoch: [1][5800/27046]	Time 0.020 (0.020)	Loss 0.5016 (0.1556)	
Epoch: [1][5810/27046]	Time 0.019 (0.020)	Loss 0.1241 (0.1556)	
Epoch: [1][5820/27046]	Time 0.019 (0.020)	Loss 1.0117 (0.1559)	
Epoch: [1][5830/27046]	Time 0.019 (0.020)	Loss 0.1121 (0.1558)	
Epoch: [1][5840/27046]	Time 0.020 (0.020)	Loss 0.0047 (0.1559)	
Epoch: [1][5850/27046]	Time 0.020 (0.020)	Loss 0.0493 (0.1558)	
Epoch: [1][5860/27046]	Time 0.020 (0.020)	Loss 0.0226 (0.1556)	
Epoch: [1][5870/27046]	Time 0.020 (0.020)	Loss 0.3030 (0.1555)	
Epoch: [1][5880/27046]	Time 0.020 (0.020)	Loss 0.0022 (0.1553)	
Epoch: [1][5890/27046]	Time 0.020 (0.020)	Loss 0.0460 (0.1554)	
Epoch: [1][5900/27046]	Time 0.020 (0.020)	Loss 0.0378 (0.1554)	
Epoch: [1][5910/27046]	Time 0.020 (0.020)	Loss 0.0134 (0.1554)	
Epoch: [1][5920/27046]	Time 0.020 (0.020)	Loss 0.1030 (0.1554)	
Epoch: [1][5930/27046]	Time 0.019 (0.020)	Loss 1.5870 (0.1555)	
Epoch: [1][5940/27046]	Time 0.019 (0.020

Epoch: [1][7090/27046]	Time 0.023 (0.020)	Loss 0.3036 (0.1550)	
Epoch: [1][7100/27046]	Time 0.021 (0.020)	Loss 0.0074 (0.1550)	
Epoch: [1][7110/27046]	Time 0.021 (0.020)	Loss 0.0222 (0.1551)	
Epoch: [1][7120/27046]	Time 0.020 (0.020)	Loss 0.0806 (0.1551)	
Epoch: [1][7130/27046]	Time 0.020 (0.020)	Loss 0.0325 (0.1550)	
Epoch: [1][7140/27046]	Time 0.020 (0.020)	Loss 0.0106 (0.1550)	
Epoch: [1][7150/27046]	Time 0.020 (0.020)	Loss 0.0276 (0.1553)	
Epoch: [1][7160/27046]	Time 0.019 (0.020)	Loss 0.0095 (0.1552)	
Epoch: [1][7170/27046]	Time 0.021 (0.020)	Loss 0.0993 (0.1551)	
Epoch: [1][7180/27046]	Time 0.021 (0.020)	Loss 0.0847 (0.1551)	
Epoch: [1][7190/27046]	Time 0.020 (0.020)	Loss 0.3645 (0.1553)	
Epoch: [1][7200/27046]	Time 0.021 (0.020)	Loss 0.1517 (0.1552)	
Epoch: [1][7210/27046]	Time 0.022 (0.020)	Loss 0.1324 (0.1553)	
Epoch: [1][7220/27046]	Time 0.023 (0.020)	Loss 0.0099 (0.1552)	
Epoch: [1][7230/27046]	Time 0.021 (0.020)	Loss 0.3186 (0.1555)	
Epoch: [1][7240/27046]	Time 0.042 (0.020

Epoch: [1][8380/27046]	Time 0.019 (0.020)	Loss 0.3256 (0.1562)	
Epoch: [1][8390/27046]	Time 0.022 (0.020)	Loss 0.0794 (0.1562)	
Epoch: [1][8400/27046]	Time 0.022 (0.020)	Loss 0.0373 (0.1561)	
Epoch: [1][8410/27046]	Time 0.020 (0.020)	Loss 0.0087 (0.1564)	
Epoch: [1][8420/27046]	Time 0.021 (0.020)	Loss 0.0003 (0.1565)	
Epoch: [1][8430/27046]	Time 0.020 (0.020)	Loss 0.2308 (0.1565)	
Epoch: [1][8440/27046]	Time 0.020 (0.020)	Loss 0.1744 (0.1564)	
Epoch: [1][8450/27046]	Time 0.020 (0.020)	Loss 0.0834 (0.1564)	
Epoch: [1][8460/27046]	Time 0.019 (0.020)	Loss 0.1353 (0.1564)	
Epoch: [1][8470/27046]	Time 0.022 (0.020)	Loss 0.0056 (0.1566)	
Epoch: [1][8480/27046]	Time 0.020 (0.020)	Loss 0.0024 (0.1565)	
Epoch: [1][8490/27046]	Time 0.021 (0.020)	Loss 0.0055 (0.1564)	
Epoch: [1][8500/27046]	Time 0.022 (0.020)	Loss 0.2735 (0.1564)	
Epoch: [1][8510/27046]	Time 0.019 (0.020)	Loss 0.3133 (0.1564)	
Epoch: [1][8520/27046]	Time 0.034 (0.020)	Loss 0.2076 (0.1564)	
Epoch: [1][8530/27046]	Time 0.021 (0.020

Epoch: [1][9670/27046]	Time 0.020 (0.020)	Loss 0.0054 (0.1569)	
Epoch: [1][9680/27046]	Time 0.021 (0.020)	Loss 0.0212 (0.1569)	
Epoch: [1][9690/27046]	Time 0.019 (0.020)	Loss 0.2292 (0.1568)	
Epoch: [1][9700/27046]	Time 0.021 (0.020)	Loss 0.0152 (0.1568)	
Epoch: [1][9710/27046]	Time 0.020 (0.020)	Loss 0.3350 (0.1567)	
Epoch: [1][9720/27046]	Time 0.020 (0.020)	Loss 0.0193 (0.1568)	
Epoch: [1][9730/27046]	Time 0.020 (0.020)	Loss 0.1250 (0.1568)	
Epoch: [1][9740/27046]	Time 0.022 (0.020)	Loss 0.0101 (0.1567)	
Epoch: [1][9750/27046]	Time 0.020 (0.020)	Loss 0.0292 (0.1568)	
Epoch: [1][9760/27046]	Time 0.022 (0.020)	Loss 0.0032 (0.1568)	
Epoch: [1][9770/27046]	Time 0.019 (0.020)	Loss 0.0101 (0.1567)	
Epoch: [1][9780/27046]	Time 0.021 (0.020)	Loss 0.1162 (0.1567)	
Epoch: [1][9790/27046]	Time 0.025 (0.020)	Loss 0.2452 (0.1567)	
Epoch: [1][9800/27046]	Time 0.037 (0.020)	Loss 0.0659 (0.1570)	
Epoch: [1][9810/27046]	Time 0.020 (0.020)	Loss 0.0185 (0.1569)	
Epoch: [1][9820/27046]	Time 0.020 (0.020

Epoch: [1][10950/27046]	Time 0.020 (0.020)	Loss 0.0514 (0.1565)	
Epoch: [1][10960/27046]	Time 0.020 (0.020)	Loss 0.0279 (0.1565)	
Epoch: [1][10970/27046]	Time 0.020 (0.020)	Loss 0.0501 (0.1567)	
Epoch: [1][10980/27046]	Time 0.020 (0.020)	Loss 0.2121 (0.1566)	
Epoch: [1][10990/27046]	Time 0.019 (0.020)	Loss 0.0235 (0.1566)	
Epoch: [1][11000/27046]	Time 0.020 (0.020)	Loss 0.2882 (0.1565)	
Epoch: [1][11010/27046]	Time 0.018 (0.020)	Loss 0.0260 (0.1565)	
Epoch: [1][11020/27046]	Time 0.019 (0.020)	Loss 0.0863 (0.1565)	
Epoch: [1][11030/27046]	Time 0.018 (0.020)	Loss 0.3477 (0.1565)	
Epoch: [1][11040/27046]	Time 0.018 (0.020)	Loss 0.1836 (0.1566)	
Epoch: [1][11050/27046]	Time 0.020 (0.020)	Loss 0.0104 (0.1565)	
Epoch: [1][11060/27046]	Time 0.018 (0.020)	Loss 0.0123 (0.1565)	
Epoch: [1][11070/27046]	Time 0.022 (0.020)	Loss 0.0680 (0.1565)	
Epoch: [1][11080/27046]	Time 0.036 (0.020)	Loss 0.0253 (0.1564)	
Epoch: [1][11090/27046]	Time 0.022 (0.020)	Loss 0.0001 (0.1564)	
Epoch: [1][11100/27046]	T

Epoch: [1][12230/27046]	Time 0.018 (0.020)	Loss 0.0073 (0.1558)	
Epoch: [1][12240/27046]	Time 0.021 (0.020)	Loss 0.0148 (0.1558)	
Epoch: [1][12250/27046]	Time 0.020 (0.020)	Loss 0.0079 (0.1557)	
Epoch: [1][12260/27046]	Time 0.020 (0.020)	Loss 0.0612 (0.1556)	
Epoch: [1][12270/27046]	Time 0.020 (0.020)	Loss 0.1628 (0.1556)	
Epoch: [1][12280/27046]	Time 0.019 (0.020)	Loss 0.2086 (0.1556)	
Epoch: [1][12290/27046]	Time 0.020 (0.020)	Loss 0.1464 (0.1556)	
Epoch: [1][12300/27046]	Time 0.019 (0.020)	Loss 0.2335 (0.1556)	
Epoch: [1][12310/27046]	Time 0.019 (0.020)	Loss 0.1075 (0.1556)	
Epoch: [1][12320/27046]	Time 0.019 (0.020)	Loss 0.0064 (0.1555)	
Epoch: [1][12330/27046]	Time 0.020 (0.020)	Loss 0.6254 (0.1555)	
Epoch: [1][12340/27046]	Time 0.019 (0.020)	Loss 0.0037 (0.1555)	
Epoch: [1][12350/27046]	Time 0.019 (0.020)	Loss 0.0362 (0.1554)	
Epoch: [1][12360/27046]	Time 0.037 (0.020)	Loss 0.7817 (0.1555)	
Epoch: [1][12370/27046]	Time 0.019 (0.020)	Loss 0.0068 (0.1555)	
Epoch: [1][12380/27046]	T

Epoch: [1][13510/27046]	Time 0.019 (0.020)	Loss 0.0271 (0.1553)	
Epoch: [1][13520/27046]	Time 0.021 (0.020)	Loss 0.2978 (0.1553)	
Epoch: [1][13530/27046]	Time 0.018 (0.020)	Loss 0.0463 (0.1552)	
Epoch: [1][13540/27046]	Time 0.020 (0.020)	Loss 0.0101 (0.1552)	
Epoch: [1][13550/27046]	Time 0.019 (0.020)	Loss 0.2280 (0.1554)	
Epoch: [1][13560/27046]	Time 0.018 (0.020)	Loss 0.2890 (0.1553)	
Epoch: [1][13570/27046]	Time 0.019 (0.020)	Loss 0.1480 (0.1553)	
Epoch: [1][13580/27046]	Time 0.025 (0.020)	Loss 0.0045 (0.1552)	
Epoch: [1][13590/27046]	Time 0.020 (0.020)	Loss 0.0080 (0.1552)	
Epoch: [1][13600/27046]	Time 0.019 (0.020)	Loss 0.0016 (0.1553)	
Epoch: [1][13610/27046]	Time 0.018 (0.020)	Loss 0.0083 (0.1552)	
Epoch: [1][13620/27046]	Time 0.021 (0.020)	Loss 0.1152 (0.1553)	
Epoch: [1][13630/27046]	Time 0.019 (0.020)	Loss 0.7694 (0.1552)	
Epoch: [1][13640/27046]	Time 0.034 (0.020)	Loss 0.0177 (0.1552)	
Epoch: [1][13650/27046]	Time 0.019 (0.020)	Loss 0.2404 (0.1552)	
Epoch: [1][13660/27046]	T

Epoch: [1][14790/27046]	Time 0.019 (0.020)	Loss 0.2752 (0.1553)	
Epoch: [1][14800/27046]	Time 0.022 (0.020)	Loss 0.1218 (0.1553)	
Epoch: [1][14810/27046]	Time 0.021 (0.020)	Loss 0.0291 (0.1553)	
Epoch: [1][14820/27046]	Time 0.021 (0.020)	Loss 0.1527 (0.1553)	
Epoch: [1][14830/27046]	Time 0.019 (0.020)	Loss 0.0305 (0.1553)	
Epoch: [1][14840/27046]	Time 0.019 (0.020)	Loss 0.0213 (0.1553)	
Epoch: [1][14850/27046]	Time 0.019 (0.020)	Loss 0.0378 (0.1552)	
Epoch: [1][14860/27046]	Time 0.019 (0.020)	Loss 0.4614 (0.1553)	
Epoch: [1][14870/27046]	Time 0.021 (0.020)	Loss 0.1962 (0.1553)	
Epoch: [1][14880/27046]	Time 0.020 (0.020)	Loss 0.0040 (0.1553)	
Epoch: [1][14890/27046]	Time 0.021 (0.020)	Loss 0.0673 (0.1553)	
Epoch: [1][14900/27046]	Time 0.020 (0.020)	Loss 0.3716 (0.1553)	
Epoch: [1][14910/27046]	Time 0.020 (0.020)	Loss 0.0277 (0.1554)	
Epoch: [1][14920/27046]	Time 0.037 (0.020)	Loss 0.1135 (0.1553)	
Epoch: [1][14930/27046]	Time 0.020 (0.020)	Loss 0.0290 (0.1553)	
Epoch: [1][14940/27046]	T

Epoch: [1][16060/27046]	Time 0.021 (0.020)	Loss 0.1304 (0.1556)	
Epoch: [1][16070/27046]	Time 0.019 (0.020)	Loss 0.0108 (0.1556)	
Epoch: [1][16080/27046]	Time 0.019 (0.020)	Loss 0.0337 (0.1556)	
Epoch: [1][16090/27046]	Time 0.021 (0.020)	Loss 0.1981 (0.1556)	
Epoch: [1][16100/27046]	Time 0.019 (0.020)	Loss 0.0112 (0.1555)	
Epoch: [1][16110/27046]	Time 0.018 (0.020)	Loss 0.0071 (0.1555)	
Epoch: [1][16120/27046]	Time 0.019 (0.020)	Loss 0.0042 (0.1555)	
Epoch: [1][16130/27046]	Time 0.019 (0.020)	Loss 0.0890 (0.1554)	
Epoch: [1][16140/27046]	Time 0.020 (0.020)	Loss 1.2422 (0.1555)	
Epoch: [1][16150/27046]	Time 0.020 (0.020)	Loss 0.1387 (0.1554)	
Epoch: [1][16160/27046]	Time 0.021 (0.020)	Loss 0.1416 (0.1554)	
Epoch: [1][16170/27046]	Time 0.022 (0.020)	Loss 0.0964 (0.1555)	
Epoch: [1][16180/27046]	Time 0.020 (0.020)	Loss 0.0031 (0.1554)	
Epoch: [1][16190/27046]	Time 0.021 (0.020)	Loss 0.7883 (0.1555)	
Epoch: [1][16200/27046]	Time 0.037 (0.020)	Loss 0.6068 (0.1556)	
Epoch: [1][16210/27046]	T

Epoch: [1][17340/27046]	Time 0.020 (0.020)	Loss 0.0536 (0.1557)	
Epoch: [1][17350/27046]	Time 0.022 (0.020)	Loss 0.0019 (0.1556)	
Epoch: [1][17360/27046]	Time 0.022 (0.020)	Loss 1.0157 (0.1557)	
Epoch: [1][17370/27046]	Time 0.020 (0.020)	Loss 0.0131 (0.1557)	
Epoch: [1][17380/27046]	Time 0.020 (0.020)	Loss 0.8911 (0.1557)	
Epoch: [1][17390/27046]	Time 0.019 (0.020)	Loss 0.0519 (0.1557)	
Epoch: [1][17400/27046]	Time 0.019 (0.020)	Loss 0.4914 (0.1557)	
Epoch: [1][17410/27046]	Time 0.020 (0.020)	Loss 0.4704 (0.1558)	
Epoch: [1][17420/27046]	Time 0.019 (0.020)	Loss 0.0058 (0.1557)	
Epoch: [1][17430/27046]	Time 0.020 (0.020)	Loss 0.0059 (0.1558)	
Epoch: [1][17440/27046]	Time 0.020 (0.020)	Loss 0.0557 (0.1557)	
Epoch: [1][17450/27046]	Time 0.020 (0.020)	Loss 0.2153 (0.1557)	
Epoch: [1][17460/27046]	Time 0.020 (0.020)	Loss 0.0076 (0.1557)	
Epoch: [1][17470/27046]	Time 0.020 (0.020)	Loss 0.0585 (0.1556)	
Epoch: [1][17480/27046]	Time 0.035 (0.020)	Loss 0.0136 (0.1556)	
Epoch: [1][17490/27046]	T

Epoch: [1][18610/27046]	Time 0.023 (0.020)	Loss 0.1845 (0.1552)	
Epoch: [1][18620/27046]	Time 0.025 (0.020)	Loss 0.6212 (0.1552)	
Epoch: [1][18630/27046]	Time 0.022 (0.020)	Loss 0.0060 (0.1551)	
Epoch: [1][18640/27046]	Time 0.022 (0.020)	Loss 0.0280 (0.1551)	
Epoch: [1][18650/27046]	Time 0.022 (0.020)	Loss 0.0698 (0.1551)	
Epoch: [1][18660/27046]	Time 0.021 (0.020)	Loss 0.0493 (0.1551)	
Epoch: [1][18670/27046]	Time 0.023 (0.020)	Loss 0.0150 (0.1551)	
Epoch: [1][18680/27046]	Time 0.020 (0.020)	Loss 0.6278 (0.1551)	
Epoch: [1][18690/27046]	Time 0.023 (0.020)	Loss 0.2172 (0.1551)	
Epoch: [1][18700/27046]	Time 0.021 (0.020)	Loss 0.1282 (0.1551)	
Epoch: [1][18710/27046]	Time 0.021 (0.020)	Loss 0.1502 (0.1551)	
Epoch: [1][18720/27046]	Time 0.020 (0.020)	Loss 0.0714 (0.1551)	
Epoch: [1][18730/27046]	Time 0.022 (0.020)	Loss 0.1341 (0.1551)	
Epoch: [1][18740/27046]	Time 0.020 (0.020)	Loss 0.0053 (0.1551)	
Epoch: [1][18750/27046]	Time 0.020 (0.020)	Loss 0.0493 (0.1552)	
Epoch: [1][18760/27046]	T

Epoch: [1][19890/27046]	Time 0.021 (0.020)	Loss 0.0994 (0.1552)	
Epoch: [1][19900/27046]	Time 0.021 (0.020)	Loss 0.6324 (0.1552)	
Epoch: [1][19910/27046]	Time 0.020 (0.020)	Loss 0.0009 (0.1552)	
Epoch: [1][19920/27046]	Time 0.023 (0.020)	Loss 0.2523 (0.1553)	
Epoch: [1][19930/27046]	Time 0.021 (0.020)	Loss 0.0013 (0.1552)	
Epoch: [1][19940/27046]	Time 0.023 (0.020)	Loss 0.1336 (0.1552)	
Epoch: [1][19950/27046]	Time 0.022 (0.020)	Loss 0.3169 (0.1552)	
Epoch: [1][19960/27046]	Time 0.022 (0.020)	Loss 0.3029 (0.1552)	
Epoch: [1][19970/27046]	Time 0.023 (0.020)	Loss 0.0712 (0.1552)	
Epoch: [1][19980/27046]	Time 0.022 (0.020)	Loss 0.0655 (0.1552)	
Epoch: [1][19990/27046]	Time 0.024 (0.020)	Loss 0.0264 (0.1552)	
Epoch: [1][20000/27046]	Time 0.023 (0.020)	Loss 0.0476 (0.1552)	
Epoch: [1][20010/27046]	Time 0.021 (0.020)	Loss 0.1284 (0.1552)	
Epoch: [1][20020/27046]	Time 0.020 (0.020)	Loss 0.0440 (0.1552)	
Epoch: [1][20030/27046]	Time 0.020 (0.020)	Loss 0.1052 (0.1552)	
Epoch: [1][20040/27046]	T

Epoch: [1][21170/27046]	Time 0.019 (0.020)	Loss 1.1947 (0.1550)	
Epoch: [1][21180/27046]	Time 0.021 (0.020)	Loss 0.0415 (0.1550)	
Epoch: [1][21190/27046]	Time 0.019 (0.020)	Loss 0.3328 (0.1550)	
Epoch: [1][21200/27046]	Time 0.022 (0.020)	Loss 0.1432 (0.1550)	
Epoch: [1][21210/27046]	Time 0.020 (0.020)	Loss 0.4450 (0.1550)	
Epoch: [1][21220/27046]	Time 0.021 (0.020)	Loss 0.1517 (0.1550)	
Epoch: [1][21230/27046]	Time 0.021 (0.020)	Loss 0.4971 (0.1550)	
Epoch: [1][21240/27046]	Time 0.021 (0.020)	Loss 0.1309 (0.1549)	
Epoch: [1][21250/27046]	Time 0.020 (0.020)	Loss 0.0765 (0.1549)	
Epoch: [1][21260/27046]	Time 0.021 (0.020)	Loss 0.0211 (0.1549)	
Epoch: [1][21270/27046]	Time 0.022 (0.020)	Loss 0.0420 (0.1549)	
Epoch: [1][21280/27046]	Time 0.020 (0.020)	Loss 0.2794 (0.1549)	
Epoch: [1][21290/27046]	Time 0.020 (0.020)	Loss 0.2393 (0.1549)	
Epoch: [1][21300/27046]	Time 0.020 (0.020)	Loss 0.1452 (0.1548)	
Epoch: [1][21310/27046]	Time 0.020 (0.020)	Loss 0.1882 (0.1548)	
Epoch: [1][21320/27046]	T

Epoch: [1][22450/27046]	Time 0.020 (0.020)	Loss 0.0615 (0.1551)	
Epoch: [1][22460/27046]	Time 0.021 (0.020)	Loss 0.2037 (0.1551)	
Epoch: [1][22470/27046]	Time 0.019 (0.020)	Loss 0.1105 (0.1551)	
Epoch: [1][22480/27046]	Time 0.023 (0.020)	Loss 0.3589 (0.1551)	
Epoch: [1][22490/27046]	Time 0.020 (0.020)	Loss 0.0390 (0.1551)	
Epoch: [1][22500/27046]	Time 0.021 (0.020)	Loss 0.0118 (0.1551)	
Epoch: [1][22510/27046]	Time 0.022 (0.020)	Loss 0.1227 (0.1550)	
Epoch: [1][22520/27046]	Time 0.020 (0.020)	Loss 0.1341 (0.1550)	
Epoch: [1][22530/27046]	Time 0.020 (0.020)	Loss 0.0939 (0.1550)	
Epoch: [1][22540/27046]	Time 0.021 (0.020)	Loss 0.0448 (0.1550)	
Epoch: [1][22550/27046]	Time 0.020 (0.020)	Loss 0.3178 (0.1550)	
Epoch: [1][22560/27046]	Time 0.020 (0.020)	Loss 0.0002 (0.1549)	
Epoch: [1][22570/27046]	Time 0.023 (0.020)	Loss 0.2152 (0.1550)	
Epoch: [1][22580/27046]	Time 0.019 (0.020)	Loss 0.2369 (0.1549)	
Epoch: [1][22590/27046]	Time 0.019 (0.020)	Loss 0.0141 (0.1549)	
Epoch: [1][22600/27046]	T

Epoch: [1][23730/27046]	Time 0.019 (0.020)	Loss 0.1148 (0.1546)	
Epoch: [1][23740/27046]	Time 0.018 (0.020)	Loss 0.2286 (0.1546)	
Epoch: [1][23750/27046]	Time 0.020 (0.020)	Loss 0.2770 (0.1546)	
Epoch: [1][23760/27046]	Time 0.021 (0.020)	Loss 0.0120 (0.1546)	
Epoch: [1][23770/27046]	Time 0.020 (0.020)	Loss 0.0726 (0.1546)	
Epoch: [1][23780/27046]	Time 0.019 (0.020)	Loss 0.0386 (0.1545)	
Epoch: [1][23790/27046]	Time 0.021 (0.020)	Loss 0.0211 (0.1545)	
Epoch: [1][23800/27046]	Time 0.020 (0.020)	Loss 0.0055 (0.1545)	
Epoch: [1][23810/27046]	Time 0.020 (0.020)	Loss 0.5654 (0.1544)	
Epoch: [1][23820/27046]	Time 0.019 (0.020)	Loss 0.0215 (0.1544)	
Epoch: [1][23830/27046]	Time 0.019 (0.020)	Loss 0.0206 (0.1545)	
Epoch: [1][23840/27046]	Time 0.019 (0.020)	Loss 0.0153 (0.1545)	
Epoch: [1][23850/27046]	Time 0.019 (0.020)	Loss 0.1040 (0.1545)	
Epoch: [1][23860/27046]	Time 0.019 (0.020)	Loss 0.1019 (0.1545)	
Epoch: [1][23870/27046]	Time 0.019 (0.020)	Loss 0.0605 (0.1545)	
Epoch: [1][23880/27046]	T

Epoch: [1][25010/27046]	Time 0.023 (0.020)	Loss 0.0039 (0.1548)	
Epoch: [1][25020/27046]	Time 0.021 (0.020)	Loss 0.0705 (0.1549)	
Epoch: [1][25030/27046]	Time 0.020 (0.020)	Loss 0.1230 (0.1549)	
Epoch: [1][25040/27046]	Time 0.020 (0.020)	Loss 0.0638 (0.1549)	
Epoch: [1][25050/27046]	Time 0.024 (0.020)	Loss 0.0756 (0.1548)	
Epoch: [1][25060/27046]	Time 0.020 (0.020)	Loss 0.2414 (0.1548)	
Epoch: [1][25070/27046]	Time 0.020 (0.020)	Loss 0.2607 (0.1548)	
Epoch: [1][25080/27046]	Time 0.021 (0.020)	Loss 0.1742 (0.1548)	
Epoch: [1][25090/27046]	Time 0.020 (0.020)	Loss 0.0791 (0.1548)	
Epoch: [1][25100/27046]	Time 0.023 (0.020)	Loss 0.0299 (0.1547)	
Epoch: [1][25110/27046]	Time 0.020 (0.020)	Loss 0.0027 (0.1548)	
Epoch: [1][25120/27046]	Time 0.020 (0.020)	Loss 0.4546 (0.1547)	
Epoch: [1][25130/27046]	Time 0.020 (0.020)	Loss 0.1118 (0.1548)	
Epoch: [1][25140/27046]	Time 0.021 (0.020)	Loss 0.0036 (0.1547)	
Epoch: [1][25150/27046]	Time 0.022 (0.020)	Loss 0.0372 (0.1547)	
Epoch: [1][25160/27046]	T

Epoch: [1][26290/27046]	Time 0.019 (0.020)	Loss 0.1063 (0.1541)	
Epoch: [1][26300/27046]	Time 0.021 (0.020)	Loss 0.0253 (0.1541)	
Epoch: [1][26310/27046]	Time 0.020 (0.020)	Loss 0.0310 (0.1542)	
Epoch: [1][26320/27046]	Time 0.020 (0.020)	Loss 0.0162 (0.1541)	
Epoch: [1][26330/27046]	Time 0.018 (0.020)	Loss 0.0787 (0.1541)	
Epoch: [1][26340/27046]	Time 0.020 (0.020)	Loss 0.0745 (0.1541)	
Epoch: [1][26350/27046]	Time 0.021 (0.020)	Loss 0.0066 (0.1541)	
Epoch: [1][26360/27046]	Time 0.020 (0.020)	Loss 0.0457 (0.1541)	
Epoch: [1][26370/27046]	Time 0.019 (0.020)	Loss 0.0559 (0.1541)	
Epoch: [1][26380/27046]	Time 0.020 (0.020)	Loss 0.0284 (0.1541)	
Epoch: [1][26390/27046]	Time 0.020 (0.020)	Loss 0.3653 (0.1542)	
Epoch: [1][26400/27046]	Time 0.019 (0.020)	Loss 0.3102 (0.1542)	
Epoch: [1][26410/27046]	Time 0.020 (0.020)	Loss 0.0810 (0.1542)	
Epoch: [1][26420/27046]	Time 0.020 (0.020)	Loss 0.0064 (0.1542)	
Epoch: [1][26430/27046]	Time 0.019 (0.020)	Loss 0.2636 (0.1541)	
Epoch: [1][26440/27046]	T

Epoch: [1][820/6762]	Time 0.004 (0.004)	
Epoch: [1][830/6762]	Time 0.004 (0.004)	
Epoch: [1][840/6762]	Time 0.004 (0.004)	
Epoch: [1][850/6762]	Time 0.004 (0.004)	
Epoch: [1][860/6762]	Time 0.003 (0.004)	
Epoch: [1][870/6762]	Time 0.004 (0.004)	
Epoch: [1][880/6762]	Time 0.004 (0.004)	
Epoch: [1][890/6762]	Time 0.004 (0.004)	
Epoch: [1][900/6762]	Time 0.004 (0.004)	
Epoch: [1][910/6762]	Time 0.005 (0.004)	
Epoch: [1][920/6762]	Time 0.005 (0.004)	
Epoch: [1][930/6762]	Time 0.004 (0.004)	
Epoch: [1][940/6762]	Time 0.004 (0.004)	
Epoch: [1][950/6762]	Time 0.004 (0.004)	
Epoch: [1][960/6762]	Time 0.004 (0.004)	
Epoch: [1][970/6762]	Time 0.004 (0.004)	
Epoch: [1][980/6762]	Time 0.004 (0.004)	
Epoch: [1][990/6762]	Time 0.004 (0.004)	
Epoch: [1][1000/6762]	Time 0.004 (0.004)	
Epoch: [1][1010/6762]	Time 0.003 (0.004)	
Epoch: [1][1020/6762]	Time 0.004 (0.004)	
Epoch: [1][1030/6762]	Time 0.003 (0.004)	
Epoch: [1][1040/6762]	Time 0.004 (0.004)	
Epoch: [1][1050/6762]	Time 0.003 (0.004)	
Epoch: [1]

Epoch: [1][2810/6762]	Time 0.004 (0.004)	
Epoch: [1][2820/6762]	Time 0.003 (0.004)	
Epoch: [1][2830/6762]	Time 0.004 (0.004)	
Epoch: [1][2840/6762]	Time 0.003 (0.004)	
Epoch: [1][2850/6762]	Time 0.004 (0.004)	
Epoch: [1][2860/6762]	Time 0.003 (0.004)	
Epoch: [1][2870/6762]	Time 0.004 (0.004)	
Epoch: [1][2880/6762]	Time 0.004 (0.004)	
Epoch: [1][2890/6762]	Time 0.004 (0.004)	
Epoch: [1][2900/6762]	Time 0.004 (0.004)	
Epoch: [1][2910/6762]	Time 0.004 (0.004)	
Epoch: [1][2920/6762]	Time 0.004 (0.004)	
Epoch: [1][2930/6762]	Time 0.003 (0.004)	
Epoch: [1][2940/6762]	Time 0.004 (0.004)	
Epoch: [1][2950/6762]	Time 0.003 (0.004)	
Epoch: [1][2960/6762]	Time 0.004 (0.004)	
Epoch: [1][2970/6762]	Time 0.004 (0.004)	
Epoch: [1][2980/6762]	Time 0.005 (0.004)	
Epoch: [1][2990/6762]	Time 0.004 (0.004)	
Epoch: [1][3000/6762]	Time 0.004 (0.004)	
Epoch: [1][3010/6762]	Time 0.004 (0.004)	
Epoch: [1][3020/6762]	Time 0.003 (0.004)	
Epoch: [1][3030/6762]	Time 0.004 (0.004)	
Epoch: [1][3040/6762]	Time 0.004 (

Epoch: [1][4800/6762]	Time 0.004 (0.004)	
Epoch: [1][4810/6762]	Time 0.004 (0.004)	
Epoch: [1][4820/6762]	Time 0.003 (0.004)	
Epoch: [1][4830/6762]	Time 0.003 (0.004)	
Epoch: [1][4840/6762]	Time 0.004 (0.004)	
Epoch: [1][4850/6762]	Time 0.004 (0.004)	
Epoch: [1][4860/6762]	Time 0.003 (0.004)	
Epoch: [1][4870/6762]	Time 0.003 (0.004)	
Epoch: [1][4880/6762]	Time 0.003 (0.004)	
Epoch: [1][4890/6762]	Time 0.003 (0.004)	
Epoch: [1][4900/6762]	Time 0.004 (0.004)	
Epoch: [1][4910/6762]	Time 0.003 (0.004)	
Epoch: [1][4920/6762]	Time 0.004 (0.004)	
Epoch: [1][4930/6762]	Time 0.004 (0.004)	
Epoch: [1][4940/6762]	Time 0.004 (0.004)	
Epoch: [1][4950/6762]	Time 0.004 (0.004)	
Epoch: [1][4960/6762]	Time 0.004 (0.004)	
Epoch: [1][4970/6762]	Time 0.003 (0.004)	
Epoch: [1][4980/6762]	Time 0.003 (0.004)	
Epoch: [1][4990/6762]	Time 0.004 (0.004)	
Epoch: [1][5000/6762]	Time 0.003 (0.004)	
Epoch: [1][5010/6762]	Time 0.004 (0.004)	
Epoch: [1][5020/6762]	Time 0.004 (0.004)	
Epoch: [1][5030/6762]	Time 0.004 (

Epoch: [1][6750/6762]	Time 0.003 (0.004)	
Epoch: [1][6760/6762]	Time 0.004 (0.004)	
* Average Loss @1: 0.1539
Epoch: [2][0/27046]	Time 0.020 (0.020)	Loss 0.5011 (0.5011)	
Epoch: [2][10/27046]	Time 0.019 (0.019)	Loss 0.0583 (0.3075)	
Epoch: [2][20/27046]	Time 0.019 (0.019)	Loss 0.5498 (0.2479)	
Epoch: [2][30/27046]	Time 0.018 (0.019)	Loss 0.2827 (0.2080)	
Epoch: [2][40/27046]	Time 0.019 (0.019)	Loss 0.0774 (0.1737)	
Epoch: [2][50/27046]	Time 0.018 (0.019)	Loss 0.1290 (0.1639)	
Epoch: [2][60/27046]	Time 0.019 (0.019)	Loss 2.0347 (0.1902)	
Epoch: [2][70/27046]	Time 0.019 (0.019)	Loss 0.2937 (0.1781)	
Epoch: [2][80/27046]	Time 0.019 (0.019)	Loss 0.0812 (0.1741)	
Epoch: [2][90/27046]	Time 0.020 (0.019)	Loss 0.0168 (0.1909)	
Epoch: [2][100/27046]	Time 0.019 (0.019)	Loss 0.0039 (0.1853)	
Epoch: [2][110/27046]	Time 0.019 (0.019)	Loss 0.0461 (0.1729)	
Epoch: [2][120/27046]	Time 0.023 (0.019)	Loss 0.0042 (0.1803)	
Epoch: [2][130/27046]	Time 0.018 (0.019)	Loss 0.0076 (0.1768)	
Epoch: [2][140/2704

Epoch: [2][1300/27046]	Time 0.020 (0.019)	Loss 0.0009 (0.1502)	
Epoch: [2][1310/27046]	Time 0.018 (0.019)	Loss 0.2441 (0.1505)	
Epoch: [2][1320/27046]	Time 0.019 (0.019)	Loss 0.0036 (0.1497)	
Epoch: [2][1330/27046]	Time 0.019 (0.019)	Loss 0.0189 (0.1491)	
Epoch: [2][1340/27046]	Time 0.020 (0.019)	Loss 0.0122 (0.1490)	
Epoch: [2][1350/27046]	Time 0.019 (0.019)	Loss 0.1977 (0.1489)	
Epoch: [2][1360/27046]	Time 0.018 (0.019)	Loss 0.3913 (0.1498)	
Epoch: [2][1370/27046]	Time 0.018 (0.019)	Loss 0.0045 (0.1495)	
Epoch: [2][1380/27046]	Time 0.019 (0.019)	Loss 0.0289 (0.1493)	
Epoch: [2][1390/27046]	Time 0.019 (0.019)	Loss 0.0898 (0.1494)	
Epoch: [2][1400/27046]	Time 0.024 (0.019)	Loss 0.0687 (0.1501)	
Epoch: [2][1410/27046]	Time 0.020 (0.019)	Loss 0.0162 (0.1499)	
Epoch: [2][1420/27046]	Time 0.019 (0.019)	Loss 0.1063 (0.1503)	
Epoch: [2][1430/27046]	Time 0.019 (0.019)	Loss 0.2380 (0.1501)	
Epoch: [2][1440/27046]	Time 0.020 (0.019)	Loss 0.3107 (0.1510)	
Epoch: [2][1450/27046]	Time 0.018 (0.019

Epoch: [2][2600/27046]	Time 0.018 (0.019)	Loss 0.0089 (0.1520)	
Epoch: [2][2610/27046]	Time 0.019 (0.019)	Loss 0.0139 (0.1526)	
Epoch: [2][2620/27046]	Time 0.019 (0.019)	Loss 1.2275 (0.1528)	
Epoch: [2][2630/27046]	Time 0.019 (0.019)	Loss 0.1261 (0.1531)	
Epoch: [2][2640/27046]	Time 0.019 (0.019)	Loss 0.0927 (0.1529)	
Epoch: [2][2650/27046]	Time 0.019 (0.019)	Loss 0.0613 (0.1537)	
Epoch: [2][2660/27046]	Time 0.019 (0.019)	Loss 0.4282 (0.1537)	
Epoch: [2][2670/27046]	Time 0.019 (0.019)	Loss 0.0272 (0.1536)	
Epoch: [2][2680/27046]	Time 0.024 (0.019)	Loss 0.0210 (0.1535)	
Epoch: [2][2690/27046]	Time 0.019 (0.019)	Loss 0.0476 (0.1532)	
Epoch: [2][2700/27046]	Time 0.020 (0.019)	Loss 0.1328 (0.1536)	
Epoch: [2][2710/27046]	Time 0.020 (0.019)	Loss 0.3306 (0.1545)	
Epoch: [2][2720/27046]	Time 0.020 (0.019)	Loss 1.6425 (0.1554)	
Epoch: [2][2730/27046]	Time 0.020 (0.019)	Loss 0.0067 (0.1554)	
Epoch: [2][2740/27046]	Time 0.019 (0.019)	Loss 0.3782 (0.1553)	
Epoch: [2][2750/27046]	Time 0.018 (0.019

Epoch: [2][3890/27046]	Time 0.018 (0.019)	Loss 0.0387 (0.1548)	
Epoch: [2][3900/27046]	Time 0.020 (0.019)	Loss 0.1036 (0.1548)	
Epoch: [2][3910/27046]	Time 0.019 (0.019)	Loss 0.0060 (0.1548)	
Epoch: [2][3920/27046]	Time 0.019 (0.019)	Loss 0.0788 (0.1548)	
Epoch: [2][3930/27046]	Time 0.019 (0.019)	Loss 0.2393 (0.1548)	
Epoch: [2][3940/27046]	Time 0.019 (0.019)	Loss 0.0803 (0.1546)	
Epoch: [2][3950/27046]	Time 0.020 (0.019)	Loss 0.0939 (0.1545)	
Epoch: [2][3960/27046]	Time 0.024 (0.019)	Loss 0.1399 (0.1544)	
Epoch: [2][3970/27046]	Time 0.020 (0.019)	Loss 0.2374 (0.1547)	
Epoch: [2][3980/27046]	Time 0.019 (0.019)	Loss 0.0448 (0.1545)	
Epoch: [2][3990/27046]	Time 0.018 (0.019)	Loss 0.7545 (0.1545)	
Epoch: [2][4000/27046]	Time 0.019 (0.019)	Loss 0.0186 (0.1544)	
Epoch: [2][4010/27046]	Time 0.018 (0.019)	Loss 0.0972 (0.1545)	
Epoch: [2][4020/27046]	Time 0.019 (0.019)	Loss 0.3953 (0.1544)	
Epoch: [2][4030/27046]	Time 0.018 (0.019)	Loss 0.0809 (0.1545)	
Epoch: [2][4040/27046]	Time 0.020 (0.019

Epoch: [2][5180/27046]	Time 0.018 (0.019)	Loss 0.0289 (0.1519)	
Epoch: [2][5190/27046]	Time 0.020 (0.019)	Loss 0.2975 (0.1518)	
Epoch: [2][5200/27046]	Time 0.019 (0.019)	Loss 0.0402 (0.1517)	
Epoch: [2][5210/27046]	Time 0.019 (0.019)	Loss 0.4314 (0.1517)	
Epoch: [2][5220/27046]	Time 0.020 (0.019)	Loss 0.5798 (0.1517)	
Epoch: [2][5230/27046]	Time 0.018 (0.019)	Loss 0.0675 (0.1517)	
Epoch: [2][5240/27046]	Time 0.024 (0.019)	Loss 0.0889 (0.1519)	
Epoch: [2][5250/27046]	Time 0.020 (0.019)	Loss 0.0449 (0.1520)	
Epoch: [2][5260/27046]	Time 0.018 (0.019)	Loss 0.0221 (0.1518)	
Epoch: [2][5270/27046]	Time 0.019 (0.019)	Loss 0.0447 (0.1520)	
Epoch: [2][5280/27046]	Time 0.019 (0.019)	Loss 0.0052 (0.1518)	
Epoch: [2][5290/27046]	Time 0.019 (0.019)	Loss 0.0569 (0.1517)	
Epoch: [2][5300/27046]	Time 0.020 (0.019)	Loss 0.0564 (0.1516)	
Epoch: [2][5310/27046]	Time 0.019 (0.019)	Loss 0.0864 (0.1515)	
Epoch: [2][5320/27046]	Time 0.020 (0.019)	Loss 0.0164 (0.1514)	
Epoch: [2][5330/27046]	Time 0.019 (0.019

Epoch: [2][6480/27046]	Time 0.019 (0.019)	Loss 0.0011 (0.1512)	
Epoch: [2][6490/27046]	Time 0.019 (0.019)	Loss 0.0233 (0.1513)	
Epoch: [2][6500/27046]	Time 0.019 (0.019)	Loss 0.6706 (0.1515)	
Epoch: [2][6510/27046]	Time 0.020 (0.019)	Loss 0.0154 (0.1515)	
Epoch: [2][6520/27046]	Time 0.024 (0.019)	Loss 0.3315 (0.1515)	
Epoch: [2][6530/27046]	Time 0.019 (0.019)	Loss 0.0305 (0.1514)	
Epoch: [2][6540/27046]	Time 0.019 (0.019)	Loss 0.0696 (0.1514)	
Epoch: [2][6550/27046]	Time 0.019 (0.019)	Loss 0.3457 (0.1514)	
Epoch: [2][6560/27046]	Time 0.021 (0.019)	Loss 0.1028 (0.1514)	
Epoch: [2][6570/27046]	Time 0.019 (0.019)	Loss 0.2440 (0.1513)	
Epoch: [2][6580/27046]	Time 0.020 (0.019)	Loss 0.4866 (0.1514)	
Epoch: [2][6590/27046]	Time 0.020 (0.019)	Loss 1.1330 (0.1517)	
Epoch: [2][6600/27046]	Time 0.020 (0.019)	Loss 0.1007 (0.1516)	
Epoch: [2][6610/27046]	Time 0.018 (0.019)	Loss 0.1811 (0.1515)	
Epoch: [2][6620/27046]	Time 0.020 (0.019)	Loss 0.0531 (0.1514)	
Epoch: [2][6630/27046]	Time 0.019 (0.019

Epoch: [2][7780/27046]	Time 0.020 (0.019)	Loss 1.0397 (0.1517)	
Epoch: [2][7790/27046]	Time 0.018 (0.019)	Loss 0.0772 (0.1517)	
Epoch: [2][7800/27046]	Time 0.027 (0.019)	Loss 0.1164 (0.1516)	
Epoch: [2][7810/27046]	Time 0.021 (0.019)	Loss 0.0401 (0.1515)	
Epoch: [2][7820/27046]	Time 0.019 (0.019)	Loss 0.0486 (0.1514)	
Epoch: [2][7830/27046]	Time 0.020 (0.019)	Loss 0.2671 (0.1515)	
Epoch: [2][7840/27046]	Time 0.019 (0.019)	Loss 0.1074 (0.1516)	
Epoch: [2][7850/27046]	Time 0.019 (0.019)	Loss 0.0039 (0.1516)	
Epoch: [2][7860/27046]	Time 0.020 (0.019)	Loss 0.1284 (0.1517)	
Epoch: [2][7870/27046]	Time 0.019 (0.019)	Loss 0.5183 (0.1519)	
Epoch: [2][7880/27046]	Time 0.019 (0.019)	Loss 0.0897 (0.1520)	
Epoch: [2][7890/27046]	Time 0.019 (0.019)	Loss 0.1030 (0.1519)	
Epoch: [2][7900/27046]	Time 0.019 (0.019)	Loss 0.2928 (0.1519)	
Epoch: [2][7910/27046]	Time 0.020 (0.019)	Loss 0.3490 (0.1519)	
Epoch: [2][7920/27046]	Time 0.019 (0.019)	Loss 0.0720 (0.1521)	
Epoch: [2][7930/27046]	Time 0.020 (0.019

Epoch: [2][9080/27046]	Time 0.027 (0.019)	Loss 0.0662 (0.1519)	
Epoch: [2][9090/27046]	Time 0.019 (0.019)	Loss 0.0496 (0.1518)	
Epoch: [2][9100/27046]	Time 0.019 (0.019)	Loss 0.1832 (0.1518)	
Epoch: [2][9110/27046]	Time 0.020 (0.019)	Loss 0.1714 (0.1518)	
Epoch: [2][9120/27046]	Time 0.020 (0.019)	Loss 0.0326 (0.1518)	
Epoch: [2][9130/27046]	Time 0.019 (0.019)	Loss 0.0048 (0.1520)	
Epoch: [2][9140/27046]	Time 0.019 (0.019)	Loss 0.0356 (0.1521)	
Epoch: [2][9150/27046]	Time 0.019 (0.019)	Loss 0.1325 (0.1520)	
Epoch: [2][9160/27046]	Time 0.019 (0.019)	Loss 0.1809 (0.1520)	
Epoch: [2][9170/27046]	Time 0.020 (0.019)	Loss 0.0321 (0.1522)	
Epoch: [2][9180/27046]	Time 0.020 (0.019)	Loss 0.4361 (0.1522)	
Epoch: [2][9190/27046]	Time 0.019 (0.019)	Loss 0.9850 (0.1523)	
Epoch: [2][9200/27046]	Time 0.019 (0.019)	Loss 0.3563 (0.1522)	
Epoch: [2][9210/27046]	Time 0.020 (0.019)	Loss 1.2339 (0.1523)	
Epoch: [2][9220/27046]	Time 0.019 (0.019)	Loss 0.0660 (0.1522)	
Epoch: [2][9230/27046]	Time 0.020 (0.019

Epoch: [2][10370/27046]	Time 0.020 (0.020)	Loss 0.0613 (0.1522)	
Epoch: [2][10380/27046]	Time 0.019 (0.020)	Loss 0.0799 (0.1522)	
Epoch: [2][10390/27046]	Time 0.018 (0.020)	Loss 0.0122 (0.1522)	
Epoch: [2][10400/27046]	Time 0.019 (0.020)	Loss 0.2213 (0.1521)	
Epoch: [2][10410/27046]	Time 0.018 (0.020)	Loss 0.0007 (0.1521)	
Epoch: [2][10420/27046]	Time 0.019 (0.020)	Loss 0.0119 (0.1520)	
Epoch: [2][10430/27046]	Time 0.019 (0.020)	Loss 0.0088 (0.1519)	
Epoch: [2][10440/27046]	Time 0.019 (0.020)	Loss 0.0313 (0.1520)	
Epoch: [2][10450/27046]	Time 0.019 (0.020)	Loss 0.0175 (0.1519)	
Epoch: [2][10460/27046]	Time 0.019 (0.020)	Loss 0.0697 (0.1518)	
Epoch: [2][10470/27046]	Time 0.019 (0.020)	Loss 0.0720 (0.1520)	
Epoch: [2][10480/27046]	Time 0.019 (0.020)	Loss 0.5570 (0.1520)	
Epoch: [2][10490/27046]	Time 0.019 (0.020)	Loss 0.0651 (0.1519)	
Epoch: [2][10500/27046]	Time 0.019 (0.020)	Loss 0.0031 (0.1518)	
Epoch: [2][10510/27046]	Time 0.018 (0.020)	Loss 0.2472 (0.1518)	
Epoch: [2][10520/27046]	T

Epoch: [2][11640/27046]	Time 0.029 (0.019)	Loss 0.5994 (0.1529)	
Epoch: [2][11650/27046]	Time 0.021 (0.019)	Loss 0.0607 (0.1529)	
Epoch: [2][11660/27046]	Time 0.019 (0.019)	Loss 0.1988 (0.1528)	
Epoch: [2][11670/27046]	Time 0.019 (0.019)	Loss 0.2710 (0.1529)	
Epoch: [2][11680/27046]	Time 0.019 (0.019)	Loss 0.0383 (0.1529)	
Epoch: [2][11690/27046]	Time 0.020 (0.019)	Loss 0.4792 (0.1529)	
Epoch: [2][11700/27046]	Time 0.020 (0.019)	Loss 0.5100 (0.1530)	
Epoch: [2][11710/27046]	Time 0.019 (0.019)	Loss 0.0724 (0.1530)	
Epoch: [2][11720/27046]	Time 0.021 (0.019)	Loss 0.2342 (0.1530)	
Epoch: [2][11730/27046]	Time 0.022 (0.019)	Loss 0.0079 (0.1530)	
Epoch: [2][11740/27046]	Time 0.019 (0.019)	Loss 0.2419 (0.1529)	
Epoch: [2][11750/27046]	Time 0.020 (0.019)	Loss 0.0015 (0.1528)	
Epoch: [2][11760/27046]	Time 0.020 (0.019)	Loss 0.4357 (0.1528)	
Epoch: [2][11770/27046]	Time 0.019 (0.019)	Loss 0.1474 (0.1528)	
Epoch: [2][11780/27046]	Time 0.020 (0.019)	Loss 0.0060 (0.1527)	
Epoch: [2][11790/27046]	T

Epoch: [2][12910/27046]	Time 0.026 (0.020)	Loss 0.0912 (0.1535)	
Epoch: [2][12920/27046]	Time 0.034 (0.020)	Loss 0.0254 (0.1535)	
Epoch: [2][12930/27046]	Time 0.022 (0.020)	Loss 0.0048 (0.1535)	
Epoch: [2][12940/27046]	Time 0.025 (0.020)	Loss 0.0081 (0.1534)	
Epoch: [2][12950/27046]	Time 0.024 (0.020)	Loss 0.6571 (0.1534)	
Epoch: [2][12960/27046]	Time 0.027 (0.020)	Loss 0.0114 (0.1533)	
Epoch: [2][12970/27046]	Time 0.022 (0.020)	Loss 0.4343 (0.1533)	
Epoch: [2][12980/27046]	Time 0.023 (0.020)	Loss 0.0429 (0.1534)	
Epoch: [2][12990/27046]	Time 0.022 (0.020)	Loss 0.0135 (0.1534)	
Epoch: [2][13000/27046]	Time 0.023 (0.020)	Loss 0.1590 (0.1534)	
Epoch: [2][13010/27046]	Time 0.029 (0.020)	Loss 0.0261 (0.1535)	
Epoch: [2][13020/27046]	Time 0.021 (0.020)	Loss 0.0442 (0.1535)	
Epoch: [2][13030/27046]	Time 0.023 (0.020)	Loss 0.5668 (0.1535)	
Epoch: [2][13040/27046]	Time 0.020 (0.020)	Loss 0.2516 (0.1535)	
Epoch: [2][13050/27046]	Time 0.019 (0.020)	Loss 0.0026 (0.1536)	
Epoch: [2][13060/27046]	T

Epoch: [2][14180/27046]	Time 0.020 (0.020)	Loss 0.0132 (0.1537)	
Epoch: [2][14190/27046]	Time 0.021 (0.020)	Loss 0.0206 (0.1537)	
Epoch: [2][14200/27046]	Time 0.045 (0.020)	Loss 0.0045 (0.1537)	
Epoch: [2][14210/27046]	Time 0.024 (0.020)	Loss 0.0148 (0.1538)	
Epoch: [2][14220/27046]	Time 0.019 (0.020)	Loss 1.3203 (0.1539)	
Epoch: [2][14230/27046]	Time 0.019 (0.020)	Loss 0.0423 (0.1539)	
Epoch: [2][14240/27046]	Time 0.022 (0.020)	Loss 0.0115 (0.1539)	
Epoch: [2][14250/27046]	Time 0.023 (0.020)	Loss 0.0230 (0.1540)	
Epoch: [2][14260/27046]	Time 0.020 (0.020)	Loss 0.1650 (0.1540)	
Epoch: [2][14270/27046]	Time 0.020 (0.020)	Loss 0.0127 (0.1539)	
Epoch: [2][14280/27046]	Time 0.020 (0.020)	Loss 0.0228 (0.1540)	
Epoch: [2][14290/27046]	Time 0.023 (0.020)	Loss 0.1765 (0.1540)	
Epoch: [2][14300/27046]	Time 0.022 (0.020)	Loss 0.0383 (0.1540)	
Epoch: [2][14310/27046]	Time 0.022 (0.020)	Loss 0.1664 (0.1540)	
Epoch: [2][14320/27046]	Time 0.022 (0.020)	Loss 0.0404 (0.1539)	
Epoch: [2][14330/27046]	T

Epoch: [2][15450/27046]	Time 0.024 (0.020)	Loss 0.0225 (0.1540)	
Epoch: [2][15460/27046]	Time 0.034 (0.020)	Loss 0.1249 (0.1540)	
Epoch: [2][15470/27046]	Time 0.024 (0.020)	Loss 0.0810 (0.1540)	
Epoch: [2][15480/27046]	Time 0.041 (0.020)	Loss 0.2504 (0.1542)	
Epoch: [2][15490/27046]	Time 0.024 (0.020)	Loss 0.0236 (0.1541)	
Epoch: [2][15500/27046]	Time 0.024 (0.020)	Loss 0.1332 (0.1541)	
Epoch: [2][15510/27046]	Time 0.022 (0.020)	Loss 0.0715 (0.1542)	
Epoch: [2][15520/27046]	Time 0.022 (0.020)	Loss 0.6966 (0.1542)	
Epoch: [2][15530/27046]	Time 0.023 (0.020)	Loss 0.0017 (0.1542)	
Epoch: [2][15540/27046]	Time 0.022 (0.020)	Loss 0.2326 (0.1542)	
Epoch: [2][15550/27046]	Time 0.020 (0.020)	Loss 0.0531 (0.1542)	
Epoch: [2][15560/27046]	Time 0.021 (0.020)	Loss 0.1140 (0.1543)	
Epoch: [2][15570/27046]	Time 0.023 (0.020)	Loss 0.1055 (0.1544)	
Epoch: [2][15580/27046]	Time 0.024 (0.020)	Loss 0.0337 (0.1545)	
Epoch: [2][15590/27046]	Time 0.023 (0.020)	Loss 0.3777 (0.1545)	
Epoch: [2][15600/27046]	T

Epoch: [2][16730/27046]	Time 0.021 (0.020)	Loss 0.0971 (0.1548)	
Epoch: [2][16740/27046]	Time 0.019 (0.020)	Loss 0.0342 (0.1548)	
Epoch: [2][16750/27046]	Time 0.019 (0.020)	Loss 0.0384 (0.1547)	
Epoch: [2][16760/27046]	Time 0.042 (0.020)	Loss 0.0190 (0.1546)	
Epoch: [2][16770/27046]	Time 0.020 (0.020)	Loss 0.0105 (0.1546)	
Epoch: [2][16780/27046]	Time 0.021 (0.020)	Loss 0.3379 (0.1546)	
Epoch: [2][16790/27046]	Time 0.019 (0.020)	Loss 0.0424 (0.1546)	
Epoch: [2][16800/27046]	Time 0.021 (0.020)	Loss 0.1224 (0.1545)	
Epoch: [2][16810/27046]	Time 0.022 (0.020)	Loss 0.0562 (0.1545)	
Epoch: [2][16820/27046]	Time 0.020 (0.020)	Loss 0.0201 (0.1545)	
Epoch: [2][16830/27046]	Time 0.021 (0.020)	Loss 0.0122 (0.1545)	
Epoch: [2][16840/27046]	Time 0.020 (0.020)	Loss 0.0232 (0.1545)	
Epoch: [2][16850/27046]	Time 0.019 (0.020)	Loss 0.0282 (0.1544)	
Epoch: [2][16860/27046]	Time 0.019 (0.020)	Loss 0.0041 (0.1543)	
Epoch: [2][16870/27046]	Time 0.020 (0.020)	Loss 0.2920 (0.1544)	
Epoch: [2][16880/27046]	T

Epoch: [2][18000/27046]	Time 0.019 (0.020)	Loss 0.0634 (0.1544)	
Epoch: [2][18010/27046]	Time 0.020 (0.020)	Loss 0.0458 (0.1543)	
Epoch: [2][18020/27046]	Time 0.019 (0.020)	Loss 0.0274 (0.1544)	
Epoch: [2][18030/27046]	Time 0.020 (0.020)	Loss 0.1130 (0.1543)	
Epoch: [2][18040/27046]	Time 0.042 (0.020)	Loss 0.0224 (0.1543)	
Epoch: [2][18050/27046]	Time 0.020 (0.020)	Loss 0.1114 (0.1543)	
Epoch: [2][18060/27046]	Time 0.019 (0.020)	Loss 0.2823 (0.1544)	
Epoch: [2][18070/27046]	Time 0.019 (0.020)	Loss 0.0491 (0.1544)	
Epoch: [2][18080/27046]	Time 0.019 (0.020)	Loss 0.2025 (0.1544)	
Epoch: [2][18090/27046]	Time 0.020 (0.020)	Loss 0.2998 (0.1544)	
Epoch: [2][18100/27046]	Time 0.021 (0.020)	Loss 0.2251 (0.1544)	
Epoch: [2][18110/27046]	Time 0.022 (0.020)	Loss 0.1208 (0.1544)	
Epoch: [2][18120/27046]	Time 0.021 (0.020)	Loss 0.0965 (0.1544)	
Epoch: [2][18130/27046]	Time 0.019 (0.020)	Loss 0.0887 (0.1544)	
Epoch: [2][18140/27046]	Time 0.019 (0.020)	Loss 0.0069 (0.1543)	
Epoch: [2][18150/27046]	T

Epoch: [2][19280/27046]	Time 0.020 (0.020)	Loss 0.5283 (0.1541)	
Epoch: [2][19290/27046]	Time 0.022 (0.020)	Loss 0.6545 (0.1541)	
Epoch: [2][19300/27046]	Time 0.021 (0.020)	Loss 0.0557 (0.1541)	
Epoch: [2][19310/27046]	Time 0.021 (0.020)	Loss 0.0080 (0.1540)	
Epoch: [2][19320/27046]	Time 0.042 (0.020)	Loss 0.3242 (0.1540)	
Epoch: [2][19330/27046]	Time 0.021 (0.020)	Loss 0.0926 (0.1540)	
Epoch: [2][19340/27046]	Time 0.020 (0.020)	Loss 0.0604 (0.1540)	
Epoch: [2][19350/27046]	Time 0.020 (0.020)	Loss 0.0903 (0.1540)	
Epoch: [2][19360/27046]	Time 0.020 (0.020)	Loss 0.0087 (0.1540)	
Epoch: [2][19370/27046]	Time 0.019 (0.020)	Loss 0.3693 (0.1541)	
Epoch: [2][19380/27046]	Time 0.020 (0.020)	Loss 0.0069 (0.1541)	
Epoch: [2][19390/27046]	Time 0.020 (0.020)	Loss 0.0852 (0.1541)	
Epoch: [2][19400/27046]	Time 0.020 (0.020)	Loss 0.0350 (0.1541)	
Epoch: [2][19410/27046]	Time 0.021 (0.020)	Loss 0.0885 (0.1541)	
Epoch: [2][19420/27046]	Time 0.020 (0.020)	Loss 0.6418 (0.1541)	
Epoch: [2][19430/27046]	T

Epoch: [2][20560/27046]	Time 0.019 (0.020)	Loss 0.0827 (0.1542)	
Epoch: [2][20570/27046]	Time 0.019 (0.020)	Loss 0.5224 (0.1542)	
Epoch: [2][20580/27046]	Time 0.019 (0.020)	Loss 0.0126 (0.1542)	
Epoch: [2][20590/27046]	Time 0.020 (0.020)	Loss 0.3083 (0.1542)	
Epoch: [2][20600/27046]	Time 0.041 (0.020)	Loss 0.1551 (0.1542)	
Epoch: [2][20610/27046]	Time 0.019 (0.020)	Loss 0.1238 (0.1542)	
Epoch: [2][20620/27046]	Time 0.019 (0.020)	Loss 0.0618 (0.1542)	
Epoch: [2][20630/27046]	Time 0.020 (0.020)	Loss 0.0987 (0.1542)	
Epoch: [2][20640/27046]	Time 0.020 (0.020)	Loss 0.4408 (0.1542)	
Epoch: [2][20650/27046]	Time 0.020 (0.020)	Loss 0.1054 (0.1541)	
Epoch: [2][20660/27046]	Time 0.019 (0.020)	Loss 0.0565 (0.1541)	
Epoch: [2][20670/27046]	Time 0.021 (0.020)	Loss 0.0030 (0.1541)	
Epoch: [2][20680/27046]	Time 0.020 (0.020)	Loss 0.0182 (0.1540)	
Epoch: [2][20690/27046]	Time 0.021 (0.020)	Loss 0.0084 (0.1540)	
Epoch: [2][20700/27046]	Time 0.019 (0.020)	Loss 0.0096 (0.1540)	
Epoch: [2][20710/27046]	T

Epoch: [2][21840/27046]	Time 0.021 (0.020)	Loss 0.0822 (0.1545)	
Epoch: [2][21850/27046]	Time 0.026 (0.020)	Loss 0.4917 (0.1546)	
Epoch: [2][21860/27046]	Time 0.022 (0.020)	Loss 1.2213 (0.1547)	
Epoch: [2][21870/27046]	Time 0.020 (0.020)	Loss 0.0097 (0.1547)	
Epoch: [2][21880/27046]	Time 0.040 (0.020)	Loss 0.0483 (0.1547)	
Epoch: [2][21890/27046]	Time 0.019 (0.020)	Loss 0.0010 (0.1546)	
Epoch: [2][21900/27046]	Time 0.019 (0.020)	Loss 0.0467 (0.1547)	
Epoch: [2][21910/27046]	Time 0.019 (0.020)	Loss 0.4553 (0.1546)	
Epoch: [2][21920/27046]	Time 0.020 (0.020)	Loss 0.0073 (0.1546)	
Epoch: [2][21930/27046]	Time 0.019 (0.020)	Loss 0.0578 (0.1546)	
Epoch: [2][21940/27046]	Time 0.018 (0.020)	Loss 0.0362 (0.1546)	
Epoch: [2][21950/27046]	Time 0.022 (0.020)	Loss 0.4917 (0.1546)	
Epoch: [2][21960/27046]	Time 0.019 (0.020)	Loss 0.1276 (0.1546)	
Epoch: [2][21970/27046]	Time 0.025 (0.020)	Loss 0.1901 (0.1546)	
Epoch: [2][21980/27046]	Time 0.030 (0.020)	Loss 0.0239 (0.1546)	
Epoch: [2][21990/27046]	T

Epoch: [2][23120/27046]	Time 0.019 (0.020)	Loss 0.1162 (0.1551)	
Epoch: [2][23130/27046]	Time 0.019 (0.020)	Loss 0.1373 (0.1551)	
Epoch: [2][23140/27046]	Time 0.019 (0.020)	Loss 0.0068 (0.1551)	
Epoch: [2][23150/27046]	Time 0.021 (0.020)	Loss 0.0197 (0.1551)	
Epoch: [2][23160/27046]	Time 0.042 (0.020)	Loss 0.0349 (0.1551)	
Epoch: [2][23170/27046]	Time 0.019 (0.020)	Loss 0.0275 (0.1551)	
Epoch: [2][23180/27046]	Time 0.018 (0.020)	Loss 0.6145 (0.1551)	
Epoch: [2][23190/27046]	Time 0.019 (0.020)	Loss 0.1344 (0.1551)	
Epoch: [2][23200/27046]	Time 0.019 (0.020)	Loss 0.0264 (0.1551)	
Epoch: [2][23210/27046]	Time 0.020 (0.020)	Loss 0.0817 (0.1551)	
Epoch: [2][23220/27046]	Time 0.019 (0.020)	Loss 0.3862 (0.1551)	
Epoch: [2][23230/27046]	Time 0.020 (0.020)	Loss 0.0058 (0.1551)	
Epoch: [2][23240/27046]	Time 0.019 (0.020)	Loss 0.1953 (0.1551)	
Epoch: [2][23250/27046]	Time 0.020 (0.020)	Loss 0.0644 (0.1551)	
Epoch: [2][23260/27046]	Time 0.018 (0.020)	Loss 0.0397 (0.1551)	
Epoch: [2][23270/27046]	T

Epoch: [2][24400/27046]	Time 0.019 (0.020)	Loss 0.5142 (0.1548)	
Epoch: [2][24410/27046]	Time 0.019 (0.020)	Loss 0.0220 (0.1548)	
Epoch: [2][24420/27046]	Time 0.020 (0.020)	Loss 0.1348 (0.1548)	
Epoch: [2][24430/27046]	Time 0.019 (0.020)	Loss 0.1216 (0.1548)	
Epoch: [2][24440/27046]	Time 0.040 (0.020)	Loss 0.2381 (0.1548)	
Epoch: [2][24450/27046]	Time 0.019 (0.020)	Loss 0.0245 (0.1548)	
Epoch: [2][24460/27046]	Time 0.020 (0.020)	Loss 0.1728 (0.1549)	
Epoch: [2][24470/27046]	Time 0.018 (0.020)	Loss 0.3779 (0.1549)	
Epoch: [2][24480/27046]	Time 0.019 (0.020)	Loss 0.0700 (0.1549)	
Epoch: [2][24490/27046]	Time 0.019 (0.020)	Loss 0.0534 (0.1549)	
Epoch: [2][24500/27046]	Time 0.019 (0.020)	Loss 0.5092 (0.1549)	
Epoch: [2][24510/27046]	Time 0.021 (0.020)	Loss 0.0489 (0.1549)	
Epoch: [2][24520/27046]	Time 0.018 (0.020)	Loss 0.4291 (0.1549)	
Epoch: [2][24530/27046]	Time 0.018 (0.020)	Loss 0.0744 (0.1549)	
Epoch: [2][24540/27046]	Time 0.021 (0.020)	Loss 0.0788 (0.1548)	
Epoch: [2][24550/27046]	T

Epoch: [2][25680/27046]	Time 0.020 (0.020)	Loss 0.4066 (0.1550)	
Epoch: [2][25690/27046]	Time 0.019 (0.020)	Loss 0.1856 (0.1550)	
Epoch: [2][25700/27046]	Time 0.019 (0.020)	Loss 0.0231 (0.1550)	
Epoch: [2][25710/27046]	Time 0.019 (0.020)	Loss 0.0132 (0.1550)	
Epoch: [2][25720/27046]	Time 0.042 (0.020)	Loss 0.1122 (0.1550)	
Epoch: [2][25730/27046]	Time 0.020 (0.020)	Loss 0.0155 (0.1550)	
Epoch: [2][25740/27046]	Time 0.019 (0.020)	Loss 0.0660 (0.1549)	
Epoch: [2][25750/27046]	Time 0.018 (0.020)	Loss 0.0390 (0.1549)	
Epoch: [2][25760/27046]	Time 0.019 (0.020)	Loss 0.1227 (0.1549)	
Epoch: [2][25770/27046]	Time 0.020 (0.020)	Loss 0.0552 (0.1550)	
Epoch: [2][25780/27046]	Time 0.020 (0.020)	Loss 0.6034 (0.1550)	
Epoch: [2][25790/27046]	Time 0.021 (0.020)	Loss 0.0290 (0.1550)	
Epoch: [2][25800/27046]	Time 0.019 (0.020)	Loss 0.0094 (0.1550)	
Epoch: [2][25810/27046]	Time 0.020 (0.020)	Loss 0.5230 (0.1550)	
Epoch: [2][25820/27046]	Time 0.019 (0.020)	Loss 0.2879 (0.1550)	
Epoch: [2][25830/27046]	T

Epoch: [2][26960/27046]	Time 0.022 (0.020)	Loss 0.0402 (0.1545)	
Epoch: [2][26970/27046]	Time 0.021 (0.020)	Loss 0.0576 (0.1545)	
Epoch: [2][26980/27046]	Time 0.022 (0.020)	Loss 0.1039 (0.1545)	
Epoch: [2][26990/27046]	Time 0.022 (0.020)	Loss 0.1142 (0.1545)	
Epoch: [2][27000/27046]	Time 0.045 (0.020)	Loss 0.0494 (0.1545)	
Epoch: [2][27010/27046]	Time 0.020 (0.020)	Loss 0.0333 (0.1546)	
Epoch: [2][27020/27046]	Time 0.020 (0.020)	Loss 0.2292 (0.1546)	
Epoch: [2][27030/27046]	Time 0.020 (0.020)	Loss 0.0834 (0.1545)	
Epoch: [2][27040/27046]	Time 0.019 (0.020)	Loss 0.0161 (0.1546)	
Average training loss this epoch: 0.1546
Epoch: [2][0/6762]	Time 0.003 (0.003)	
Epoch: [2][10/6762]	Time 0.003 (0.003)	
Epoch: [2][20/6762]	Time 0.004 (0.004)	
Epoch: [2][30/6762]	Time 0.004 (0.004)	
Epoch: [2][40/6762]	Time 0.004 (0.004)	
Epoch: [2][50/6762]	Time 0.004 (0.004)	
Epoch: [2][60/6762]	Time 0.003 (0.004)	
Epoch: [2][70/6762]	Time 0.004 (0.004)	
Epoch: [2][80/6762]	Time 0.003 (0.004)	
Epoch: [2][90/6

Epoch: [2][1830/6762]	Time 0.003 (0.004)	
Epoch: [2][1840/6762]	Time 0.004 (0.004)	
Epoch: [2][1850/6762]	Time 0.004 (0.004)	
Epoch: [2][1860/6762]	Time 0.004 (0.004)	
Epoch: [2][1870/6762]	Time 0.003 (0.004)	
Epoch: [2][1880/6762]	Time 0.004 (0.004)	
Epoch: [2][1890/6762]	Time 0.004 (0.004)	
Epoch: [2][1900/6762]	Time 0.003 (0.004)	
Epoch: [2][1910/6762]	Time 0.004 (0.004)	
Epoch: [2][1920/6762]	Time 0.004 (0.004)	
Epoch: [2][1930/6762]	Time 0.004 (0.004)	
Epoch: [2][1940/6762]	Time 0.004 (0.004)	
Epoch: [2][1950/6762]	Time 0.003 (0.004)	
Epoch: [2][1960/6762]	Time 0.004 (0.004)	
Epoch: [2][1970/6762]	Time 0.006 (0.004)	
Epoch: [2][1980/6762]	Time 0.003 (0.004)	
Epoch: [2][1990/6762]	Time 0.003 (0.004)	
Epoch: [2][2000/6762]	Time 0.003 (0.004)	
Epoch: [2][2010/6762]	Time 0.004 (0.004)	
Epoch: [2][2020/6762]	Time 0.004 (0.004)	
Epoch: [2][2030/6762]	Time 0.004 (0.004)	
Epoch: [2][2040/6762]	Time 0.004 (0.004)	
Epoch: [2][2050/6762]	Time 0.003 (0.004)	
Epoch: [2][2060/6762]	Time 0.003 (

Epoch: [2][3790/6762]	Time 0.003 (0.004)	
Epoch: [2][3800/6762]	Time 0.003 (0.004)	
Epoch: [2][3810/6762]	Time 0.004 (0.004)	
Epoch: [2][3820/6762]	Time 0.004 (0.004)	
Epoch: [2][3830/6762]	Time 0.003 (0.004)	
Epoch: [2][3840/6762]	Time 0.004 (0.004)	
Epoch: [2][3850/6762]	Time 0.003 (0.004)	
Epoch: [2][3860/6762]	Time 0.005 (0.004)	
Epoch: [2][3870/6762]	Time 0.003 (0.004)	
Epoch: [2][3880/6762]	Time 0.004 (0.004)	
Epoch: [2][3890/6762]	Time 0.003 (0.004)	
Epoch: [2][3900/6762]	Time 0.003 (0.004)	
Epoch: [2][3910/6762]	Time 0.004 (0.004)	
Epoch: [2][3920/6762]	Time 0.004 (0.004)	
Epoch: [2][3930/6762]	Time 0.004 (0.004)	
Epoch: [2][3940/6762]	Time 0.004 (0.004)	
Epoch: [2][3950/6762]	Time 0.004 (0.004)	
Epoch: [2][3960/6762]	Time 0.004 (0.004)	
Epoch: [2][3970/6762]	Time 0.003 (0.004)	
Epoch: [2][3980/6762]	Time 0.004 (0.004)	
Epoch: [2][3990/6762]	Time 0.004 (0.004)	
Epoch: [2][4000/6762]	Time 0.003 (0.004)	
Epoch: [2][4010/6762]	Time 0.003 (0.004)	
Epoch: [2][4020/6762]	Time 0.003 (

Epoch: [2][5790/6762]	Time 0.004 (0.004)	
Epoch: [2][5800/6762]	Time 0.003 (0.004)	
Epoch: [2][5810/6762]	Time 0.004 (0.004)	
Epoch: [2][5820/6762]	Time 0.003 (0.004)	
Epoch: [2][5830/6762]	Time 0.003 (0.004)	
Epoch: [2][5840/6762]	Time 0.003 (0.004)	
Epoch: [2][5850/6762]	Time 0.004 (0.004)	
Epoch: [2][5860/6762]	Time 0.004 (0.004)	
Epoch: [2][5870/6762]	Time 0.003 (0.004)	
Epoch: [2][5880/6762]	Time 0.004 (0.004)	
Epoch: [2][5890/6762]	Time 0.006 (0.004)	
Epoch: [2][5900/6762]	Time 0.004 (0.004)	
Epoch: [2][5910/6762]	Time 0.004 (0.004)	
Epoch: [2][5920/6762]	Time 0.003 (0.004)	
Epoch: [2][5930/6762]	Time 0.004 (0.004)	
Epoch: [2][5940/6762]	Time 0.004 (0.004)	
Epoch: [2][5950/6762]	Time 0.003 (0.004)	
Epoch: [2][5960/6762]	Time 0.003 (0.004)	
Epoch: [2][5970/6762]	Time 0.004 (0.004)	
Epoch: [2][5980/6762]	Time 0.004 (0.004)	
Epoch: [2][5990/6762]	Time 0.004 (0.004)	
Epoch: [2][6000/6762]	Time 0.004 (0.004)	
Epoch: [2][6010/6762]	Time 0.004 (0.004)	
Epoch: [2][6020/6762]	Time 0.004 (

Epoch: [3][650/27046]	Time 0.019 (0.019)	Loss 0.3325 (0.1442)	
Epoch: [3][660/27046]	Time 0.018 (0.019)	Loss 0.1371 (0.1446)	
Epoch: [3][670/27046]	Time 0.019 (0.019)	Loss 0.3995 (0.1452)	
Epoch: [3][680/27046]	Time 0.038 (0.019)	Loss 0.0012 (0.1458)	
Epoch: [3][690/27046]	Time 0.018 (0.019)	Loss 0.4706 (0.1454)	
Epoch: [3][700/27046]	Time 0.019 (0.019)	Loss 0.0822 (0.1455)	
Epoch: [3][710/27046]	Time 0.019 (0.019)	Loss 0.1147 (0.1467)	
Epoch: [3][720/27046]	Time 0.020 (0.019)	Loss 0.0603 (0.1463)	
Epoch: [3][730/27046]	Time 0.019 (0.019)	Loss 0.1811 (0.1461)	
Epoch: [3][740/27046]	Time 0.020 (0.019)	Loss 0.1522 (0.1454)	
Epoch: [3][750/27046]	Time 0.020 (0.019)	Loss 0.1592 (0.1454)	
Epoch: [3][760/27046]	Time 0.018 (0.019)	Loss 0.2921 (0.1454)	
Epoch: [3][770/27046]	Time 0.020 (0.019)	Loss 0.1590 (0.1454)	
Epoch: [3][780/27046]	Time 0.020 (0.019)	Loss 0.0497 (0.1454)	
Epoch: [3][790/27046]	Time 0.019 (0.019)	Loss 0.0367 (0.1464)	
Epoch: [3][800/27046]	Time 0.020 (0.019)	Loss 0.0304 (0

Epoch: [3][1950/27046]	Time 0.019 (0.020)	Loss 0.0111 (0.1493)	
Epoch: [3][1960/27046]	Time 0.040 (0.020)	Loss 0.0387 (0.1491)	
Epoch: [3][1970/27046]	Time 0.019 (0.020)	Loss 0.1793 (0.1494)	
Epoch: [3][1980/27046]	Time 0.020 (0.020)	Loss 0.0153 (0.1489)	
Epoch: [3][1990/27046]	Time 0.019 (0.020)	Loss 0.0920 (0.1494)	
Epoch: [3][2000/27046]	Time 0.023 (0.020)	Loss 0.2353 (0.1494)	
Epoch: [3][2010/27046]	Time 0.024 (0.020)	Loss 0.0779 (0.1495)	
Epoch: [3][2020/27046]	Time 0.021 (0.020)	Loss 0.0488 (0.1509)	
Epoch: [3][2030/27046]	Time 0.020 (0.020)	Loss 0.1602 (0.1508)	
Epoch: [3][2040/27046]	Time 0.021 (0.020)	Loss 0.0081 (0.1505)	
Epoch: [3][2050/27046]	Time 0.018 (0.020)	Loss 0.2895 (0.1516)	
Epoch: [3][2060/27046]	Time 0.019 (0.020)	Loss 0.5814 (0.1528)	
Epoch: [3][2070/27046]	Time 0.020 (0.020)	Loss 0.0665 (0.1525)	
Epoch: [3][2080/27046]	Time 0.021 (0.020)	Loss 0.0493 (0.1526)	
Epoch: [3][2090/27046]	Time 0.020 (0.020)	Loss 0.1008 (0.1525)	
Epoch: [3][2100/27046]	Time 0.022 (0.020

Epoch: [3][3240/27046]	Time 0.043 (0.021)	Loss 0.0325 (0.1527)	
Epoch: [3][3250/27046]	Time 0.020 (0.021)	Loss 0.1437 (0.1526)	
Epoch: [3][3260/27046]	Time 0.019 (0.021)	Loss 0.0684 (0.1524)	
Epoch: [3][3270/27046]	Time 0.020 (0.021)	Loss 0.0060 (0.1524)	
Epoch: [3][3280/27046]	Time 0.020 (0.021)	Loss 0.1693 (0.1525)	
Epoch: [3][3290/27046]	Time 0.024 (0.021)	Loss 0.0157 (0.1525)	
Epoch: [3][3300/27046]	Time 0.018 (0.021)	Loss 0.0173 (0.1525)	
Epoch: [3][3310/27046]	Time 0.020 (0.021)	Loss 0.1974 (0.1526)	
Epoch: [3][3320/27046]	Time 0.019 (0.021)	Loss 0.5516 (0.1526)	
Epoch: [3][3330/27046]	Time 0.020 (0.021)	Loss 0.3118 (0.1528)	
Epoch: [3][3340/27046]	Time 0.021 (0.021)	Loss 0.4053 (0.1526)	
Epoch: [3][3350/27046]	Time 0.022 (0.021)	Loss 0.1195 (0.1524)	
Epoch: [3][3360/27046]	Time 0.024 (0.021)	Loss 0.0359 (0.1525)	
Epoch: [3][3370/27046]	Time 0.021 (0.021)	Loss 0.0504 (0.1524)	
Epoch: [3][3380/27046]	Time 0.021 (0.021)	Loss 0.6198 (0.1528)	
Epoch: [3][3390/27046]	Time 0.019 (0.021

Epoch: [3][4540/27046]	Time 0.022 (0.021)	Loss 0.0134 (0.1531)	
Epoch: [3][4550/27046]	Time 0.023 (0.021)	Loss 0.3842 (0.1533)	
Epoch: [3][4560/27046]	Time 0.020 (0.021)	Loss 0.4795 (0.1535)	
Epoch: [3][4570/27046]	Time 0.025 (0.021)	Loss 0.1964 (0.1535)	
Epoch: [3][4580/27046]	Time 0.021 (0.021)	Loss 0.0667 (0.1534)	
Epoch: [3][4590/27046]	Time 0.019 (0.021)	Loss 0.0896 (0.1534)	
Epoch: [3][4600/27046]	Time 0.022 (0.021)	Loss 0.2514 (0.1532)	
Epoch: [3][4610/27046]	Time 0.022 (0.021)	Loss 0.0049 (0.1531)	
Epoch: [3][4620/27046]	Time 0.027 (0.021)	Loss 0.4295 (0.1531)	
Epoch: [3][4630/27046]	Time 0.023 (0.021)	Loss 0.0700 (0.1531)	
Epoch: [3][4640/27046]	Time 0.026 (0.021)	Loss 0.1947 (0.1530)	
Epoch: [3][4650/27046]	Time 0.020 (0.021)	Loss 0.1602 (0.1531)	
Epoch: [3][4660/27046]	Time 0.025 (0.021)	Loss 0.0436 (0.1531)	
Epoch: [3][4670/27046]	Time 0.023 (0.021)	Loss 0.0137 (0.1534)	
Epoch: [3][4680/27046]	Time 0.023 (0.021)	Loss 0.0059 (0.1533)	
Epoch: [3][4690/27046]	Time 0.023 (0.021

Epoch: [3][5830/27046]	Time 0.021 (0.021)	Loss 0.0486 (0.1530)	
Epoch: [3][5840/27046]	Time 0.025 (0.021)	Loss 0.0676 (0.1530)	
Epoch: [3][5850/27046]	Time 0.018 (0.021)	Loss 0.2777 (0.1529)	
Epoch: [3][5860/27046]	Time 0.020 (0.021)	Loss 0.3997 (0.1531)	
Epoch: [3][5870/27046]	Time 0.022 (0.021)	Loss 0.0835 (0.1531)	
Epoch: [3][5880/27046]	Time 0.023 (0.021)	Loss 0.0528 (0.1530)	
Epoch: [3][5890/27046]	Time 0.022 (0.021)	Loss 0.0231 (0.1531)	
Epoch: [3][5900/27046]	Time 0.020 (0.021)	Loss 0.0259 (0.1530)	
Epoch: [3][5910/27046]	Time 0.020 (0.021)	Loss 0.0004 (0.1528)	
Epoch: [3][5920/27046]	Time 0.019 (0.021)	Loss 0.1933 (0.1527)	
Epoch: [3][5930/27046]	Time 0.023 (0.021)	Loss 0.0045 (0.1527)	
Epoch: [3][5940/27046]	Time 0.020 (0.021)	Loss 0.4976 (0.1526)	
Epoch: [3][5950/27046]	Time 0.019 (0.021)	Loss 0.0440 (0.1524)	
Epoch: [3][5960/27046]	Time 0.019 (0.021)	Loss 0.1711 (0.1525)	
Epoch: [3][5970/27046]	Time 0.018 (0.021)	Loss 0.9662 (0.1527)	
Epoch: [3][5980/27046]	Time 0.019 (0.021

Epoch: [3][7120/27046]	Time 0.019 (0.021)	Loss 0.2147 (0.1514)	
Epoch: [3][7130/27046]	Time 0.021 (0.021)	Loss 0.0226 (0.1515)	
Epoch: [3][7140/27046]	Time 0.020 (0.021)	Loss 0.0439 (0.1515)	
Epoch: [3][7150/27046]	Time 0.021 (0.021)	Loss 0.3832 (0.1514)	
Epoch: [3][7160/27046]	Time 0.022 (0.021)	Loss 0.0240 (0.1513)	
Epoch: [3][7170/27046]	Time 0.020 (0.021)	Loss 0.0531 (0.1513)	
Epoch: [3][7180/27046]	Time 0.023 (0.021)	Loss 0.0135 (0.1513)	
Epoch: [3][7190/27046]	Time 0.020 (0.021)	Loss 0.2444 (0.1513)	
Epoch: [3][7200/27046]	Time 0.019 (0.021)	Loss 0.0011 (0.1512)	
Epoch: [3][7210/27046]	Time 0.019 (0.021)	Loss 0.2605 (0.1511)	
Epoch: [3][7220/27046]	Time 0.019 (0.021)	Loss 0.0163 (0.1511)	
Epoch: [3][7230/27046]	Time 0.020 (0.021)	Loss 0.0828 (0.1511)	
Epoch: [3][7240/27046]	Time 0.020 (0.021)	Loss 0.2229 (0.1513)	
Epoch: [3][7250/27046]	Time 0.019 (0.021)	Loss 0.2431 (0.1514)	
Epoch: [3][7260/27046]	Time 0.019 (0.021)	Loss 0.0041 (0.1513)	
Epoch: [3][7270/27046]	Time 0.021 (0.021

Epoch: [3][8420/27046]	Time 0.019 (0.021)	Loss 0.3452 (0.1515)	
Epoch: [3][8430/27046]	Time 0.022 (0.021)	Loss 0.2605 (0.1514)	
Epoch: [3][8440/27046]	Time 0.023 (0.021)	Loss 0.1967 (0.1513)	
Epoch: [3][8450/27046]	Time 0.020 (0.021)	Loss 0.0331 (0.1513)	
Epoch: [3][8460/27046]	Time 0.019 (0.021)	Loss 0.0457 (0.1515)	
Epoch: [3][8470/27046]	Time 0.021 (0.021)	Loss 0.2604 (0.1515)	
Epoch: [3][8480/27046]	Time 0.020 (0.021)	Loss 0.0098 (0.1514)	
Epoch: [3][8490/27046]	Time 0.019 (0.021)	Loss 0.3498 (0.1514)	
Epoch: [3][8500/27046]	Time 0.020 (0.021)	Loss 0.0149 (0.1516)	
Epoch: [3][8510/27046]	Time 0.020 (0.021)	Loss 0.0176 (0.1515)	
Epoch: [3][8520/27046]	Time 0.020 (0.021)	Loss 0.0508 (0.1515)	
Epoch: [3][8530/27046]	Time 0.020 (0.021)	Loss 0.3028 (0.1515)	
Epoch: [3][8540/27046]	Time 0.019 (0.021)	Loss 0.0534 (0.1515)	
Epoch: [3][8550/27046]	Time 0.021 (0.021)	Loss 0.1188 (0.1515)	
Epoch: [3][8560/27046]	Time 0.020 (0.021)	Loss 0.0395 (0.1514)	
Epoch: [3][8570/27046]	Time 0.020 (0.021

Epoch: [3][9710/27046]	Time 0.022 (0.021)	Loss 0.0667 (0.1514)	
Epoch: [3][9720/27046]	Time 0.019 (0.021)	Loss 0.0290 (0.1517)	
Epoch: [3][9730/27046]	Time 0.020 (0.021)	Loss 0.4420 (0.1518)	
Epoch: [3][9740/27046]	Time 0.019 (0.021)	Loss 0.0692 (0.1518)	
Epoch: [3][9750/27046]	Time 0.018 (0.021)	Loss 0.1601 (0.1517)	
Epoch: [3][9760/27046]	Time 0.021 (0.021)	Loss 0.1049 (0.1517)	
Epoch: [3][9770/27046]	Time 0.020 (0.021)	Loss 0.0193 (0.1517)	
Epoch: [3][9780/27046]	Time 0.020 (0.021)	Loss 0.0111 (0.1516)	
Epoch: [3][9790/27046]	Time 0.020 (0.021)	Loss 0.0180 (0.1516)	
Epoch: [3][9800/27046]	Time 0.018 (0.021)	Loss 0.2413 (0.1516)	
Epoch: [3][9810/27046]	Time 0.019 (0.021)	Loss 0.0539 (0.1515)	
Epoch: [3][9820/27046]	Time 0.019 (0.021)	Loss 0.0444 (0.1515)	
Epoch: [3][9830/27046]	Time 0.020 (0.021)	Loss 0.0202 (0.1515)	
Epoch: [3][9840/27046]	Time 0.019 (0.021)	Loss 0.0833 (0.1515)	
Epoch: [3][9850/27046]	Time 0.020 (0.021)	Loss 0.0685 (0.1516)	
Epoch: [3][9860/27046]	Time 0.021 (0.021

Epoch: [3][10980/27046]	Time 0.021 (0.021)	Loss 0.1875 (0.1522)	
Epoch: [3][10990/27046]	Time 0.021 (0.021)	Loss 0.0211 (0.1523)	
Epoch: [3][11000/27046]	Time 0.019 (0.021)	Loss 0.2925 (0.1523)	
Epoch: [3][11010/27046]	Time 0.019 (0.021)	Loss 0.4738 (0.1523)	
Epoch: [3][11020/27046]	Time 0.020 (0.021)	Loss 0.0731 (0.1522)	
Epoch: [3][11030/27046]	Time 0.020 (0.021)	Loss 0.0130 (0.1524)	
Epoch: [3][11040/27046]	Time 0.020 (0.021)	Loss 0.0701 (0.1523)	
Epoch: [3][11050/27046]	Time 0.022 (0.021)	Loss 0.0074 (0.1522)	
Epoch: [3][11060/27046]	Time 0.021 (0.021)	Loss 0.0212 (0.1522)	
Epoch: [3][11070/27046]	Time 0.018 (0.021)	Loss 0.1171 (0.1523)	
Epoch: [3][11080/27046]	Time 0.018 (0.021)	Loss 0.1071 (0.1523)	
Epoch: [3][11090/27046]	Time 0.019 (0.021)	Loss 0.0342 (0.1523)	
Epoch: [3][11100/27046]	Time 0.021 (0.021)	Loss 0.0580 (0.1523)	
Epoch: [3][11110/27046]	Time 0.019 (0.021)	Loss 0.0607 (0.1522)	
Epoch: [3][11120/27046]	Time 0.019 (0.021)	Loss 0.1483 (0.1522)	
Epoch: [3][11130/27046]	T

Epoch: [3][12250/27046]	Time 0.022 (0.021)	Loss 0.0145 (0.1532)	
Epoch: [3][12260/27046]	Time 0.019 (0.021)	Loss 0.1646 (0.1532)	
Epoch: [3][12270/27046]	Time 0.020 (0.021)	Loss 0.0766 (0.1531)	
Epoch: [3][12280/27046]	Time 0.020 (0.021)	Loss 0.4242 (0.1531)	
Epoch: [3][12290/27046]	Time 0.020 (0.021)	Loss 0.0072 (0.1532)	
Epoch: [3][12300/27046]	Time 0.019 (0.021)	Loss 0.1280 (0.1532)	
Epoch: [3][12310/27046]	Time 0.020 (0.021)	Loss 0.1227 (0.1532)	
Epoch: [3][12320/27046]	Time 0.020 (0.021)	Loss 0.2776 (0.1531)	
Epoch: [3][12330/27046]	Time 0.019 (0.021)	Loss 0.0157 (0.1531)	
Epoch: [3][12340/27046]	Time 0.019 (0.021)	Loss 0.0651 (0.1530)	
Epoch: [3][12350/27046]	Time 0.018 (0.021)	Loss 0.0473 (0.1531)	
Epoch: [3][12360/27046]	Time 0.019 (0.021)	Loss 0.0721 (0.1531)	
Epoch: [3][12370/27046]	Time 0.019 (0.021)	Loss 0.0830 (0.1531)	
Epoch: [3][12380/27046]	Time 0.020 (0.021)	Loss 0.0247 (0.1530)	
Epoch: [3][12390/27046]	Time 0.021 (0.021)	Loss 0.0364 (0.1530)	
Epoch: [3][12400/27046]	T

Epoch: [3][13520/27046]	Time 0.019 (0.021)	Loss 0.1076 (0.1535)	
Epoch: [3][13530/27046]	Time 0.019 (0.021)	Loss 0.0002 (0.1535)	
Epoch: [3][13540/27046]	Time 0.021 (0.021)	Loss 0.0058 (0.1535)	
Epoch: [3][13550/27046]	Time 0.021 (0.021)	Loss 0.2346 (0.1534)	
Epoch: [3][13560/27046]	Time 0.020 (0.021)	Loss 0.6761 (0.1535)	
Epoch: [3][13570/27046]	Time 0.019 (0.021)	Loss 0.0443 (0.1535)	
Epoch: [3][13580/27046]	Time 0.018 (0.021)	Loss 0.0036 (0.1535)	
Epoch: [3][13590/27046]	Time 0.019 (0.021)	Loss 0.0393 (0.1535)	
Epoch: [3][13600/27046]	Time 0.018 (0.021)	Loss 0.0303 (0.1535)	
Epoch: [3][13610/27046]	Time 0.022 (0.021)	Loss 0.0881 (0.1534)	
Epoch: [3][13620/27046]	Time 0.018 (0.021)	Loss 0.0158 (0.1534)	
Epoch: [3][13630/27046]	Time 0.019 (0.021)	Loss 0.1348 (0.1535)	
Epoch: [3][13640/27046]	Time 0.019 (0.021)	Loss 0.0124 (0.1534)	
Epoch: [3][13650/27046]	Time 0.019 (0.021)	Loss 0.0208 (0.1533)	
Epoch: [3][13660/27046]	Time 0.018 (0.021)	Loss 0.0253 (0.1534)	
Epoch: [3][13670/27046]	T

Epoch: [3][14800/27046]	Time 0.020 (0.021)	Loss 0.0613 (0.1534)	
Epoch: [3][14810/27046]	Time 0.020 (0.021)	Loss 0.0297 (0.1534)	
Epoch: [3][14820/27046]	Time 0.018 (0.021)	Loss 0.0278 (0.1534)	
Epoch: [3][14830/27046]	Time 0.022 (0.021)	Loss 0.1613 (0.1534)	
Epoch: [3][14840/27046]	Time 0.019 (0.021)	Loss 0.9779 (0.1534)	
Epoch: [3][14850/27046]	Time 0.019 (0.021)	Loss 0.0384 (0.1535)	
Epoch: [3][14860/27046]	Time 0.020 (0.021)	Loss 0.5425 (0.1535)	
Epoch: [3][14870/27046]	Time 0.019 (0.021)	Loss 0.0747 (0.1534)	
Epoch: [3][14880/27046]	Time 0.020 (0.021)	Loss 0.0402 (0.1534)	
Epoch: [3][14890/27046]	Time 0.019 (0.021)	Loss 0.0180 (0.1534)	
Epoch: [3][14900/27046]	Time 0.019 (0.021)	Loss 0.0564 (0.1534)	
Epoch: [3][14910/27046]	Time 0.019 (0.021)	Loss 0.4135 (0.1533)	
Epoch: [3][14920/27046]	Time 0.021 (0.021)	Loss 0.0260 (0.1533)	
Epoch: [3][14930/27046]	Time 0.023 (0.021)	Loss 0.1678 (0.1533)	
Epoch: [3][14940/27046]	Time 0.021 (0.021)	Loss 0.0056 (0.1533)	
Epoch: [3][14950/27046]	T

KeyboardInterrupt: 

## Driver Code

In [4]:
def evaluate(assignments, args):
    
    # log source of hyperparameter suggestion
    sigopt.log_metadata('optimizer', "Adam")
    sigopt.log_model("Vanilla Vision Transformer")
    sigopt.log_dataset("Udacity self-driving dataset ")

    sigopt.params.setdefault("learning_rate", float(args['learning_rate']))
    sigopt.params.setdefault("reg", float(args['reg']))
#     sigopt.params.setdefault("batch_size", int(args['batch_size']))
    sigopt.params.setdefault("num_heads", int(args['num_heads']))
    sigopt.params.setdefault("num_layers", int(args['num_layers']))
#     sigopt.params.setdefault("patch_size", int(args['patch_size']))
#     sigopt.params.setdefault("embed_dim", int(args['embed_dim']))
    
    
    # Normalizing images per the paper and resizing each image to 64 x 192.
    transform = transforms.Compose([
        # Citation:
        # https://pytorch.org/vision/stable/transforms.html#scriptable-transforms
        transforms.Resize((64, 192)),
    ])
    
    print("Params : ", sigopt.params)
    # Loading in images with normalization and resizing applied.
    training_set, validation_set, test_set = dataset.load_nvidia_dataset(batch_size=BATCH_SIZE, 
                                                                         transform=transform)

    image_size = training_set.dataset[0][0].shape

    model = VanillaVisionTransformer.VisionTransformer(device,
                                                image_size,
                                               PATCH_SIZE, 
                                               HIDDEN_DIM,
                                               EMBED_DIM,
                                               NUM_CHANNELS,
                                               sigopt.params.num_heads,
                                               sigopt.params.num_layers,
                                               DROPOUT).to(device)
    
    criterion = nn.MSELoss()

    optimizer = torch.optim.Adam(model.parameters(), lr=float(sigopt.params.learning_rate), 
                                 weight_decay =float(sigopt.params.reg))
#     scheduler = torch.optim.lr_scheduler.ReduceLROnPlateau(optimizer)
    
    best = float('inf')
    best_model = None
    best_epoch = None
    train_losses = []
    valid_losses = []
    scaler = torch.cuda.amp.GradScaler()


    for epoch in range(NUM_EPOCHS):
        
        # Training.
        train_loss = train(epoch, training_set, model, optimizer, criterion, scaler=scaler)
        temp = train_loss
        temp.cpu()
        temp = float(temp)
        train_losses.append(temp)
        print(f"Average training loss this epoch: {temp:.4f}")
                
        # Validation.
        valid_loss = validate(epoch, validation_set, model, criterion)
        temp = valid_loss
        temp.cpu()
        temp = float(temp)
        valid_losses.append(temp)
        
#         scheduler.step(train_loss)
        
        if valid_loss < best:
            best = valid_loss
            best_model = copy.deepcopy(model)
            best_epoch = epoch
            
    print('Best Loss @1: {:.4f}'.format(best))
    
    losses_to_plot = train_losses, valid_losses
    plots(losses_to_plot, 
          lr=LEARNING_RATE, 
          reg=WEIGHT_DECAY_REGULARIZATION_TERM,
          batch=BATCH_SIZE, 
          # momentum=MOMENTUM  # not necessary for ADAM
         )

    torch.save(best_model.state_dict(), './checkpoints/vanilla_vision_transformer.pth')  
    sigopt.log_metric(name='RMSE', value=best)
    return best.cpu().numpy()

In [19]:
# sigopt setup
import sigopt
import os
os.environ["SIGOPT_API_TOKEN"] = "XWBIVDWCVQXALUZQFDHNGOELLLKDJBMOJALEPCNQXQGBNIGC"
os.environ['SIGOPT_PROJECT'] = 'vanilla_vit'

args = {
    'learning_rate': 0.005,
    'reg': 0.0005,
    'num_heads': 2,
    'num_layers': 6,
    'patch_size': 8,
    'embed_dim': 512
}

  "class": algorithms.Blowfish,


In [20]:
sigopt.set_project('vanilla_vit')
conn = sigopt.Connection(client_token=os.environ.get("SIGOPT_API_TOKEN"))
experiment = conn.experiments().create(
    
    name="Vanilla ViT Optimization 4",
 
    parameters=[
        dict(name="reg", bounds=dict(min=0.00001, max=1), type="double", transformation="log"),
        dict(name="learning_rate", bounds=dict(min=0.00001 ,max=0.1), type="double", transformation="log"),
#         dict(name="batch_size", categorical_values=["1","8","16", "32", "64"], type="categorical"),
        dict(name="num_heads", bounds=dict(min=2, max=10), type="int"),
        dict(name="num_layers", bounds=dict(min=2, max=10), type="int"),
#         dict(name="patch_size", categorical_values=["4","8","16"], type="categorical"),
#         dict(name="embed_dim", categorical_values=["256","512","768", "1024"], type="categorical")
        ],
 
    metrics=[
        dict(name="RMSE", objective="minimize", strategy="optimize")
        ],
 
    observation_budget = 30,
)
 
print("Explore your experiment: https://app.sigopt.com/experiment/" + experiment.id + "/analysis")

Explore your experiment: https://app.sigopt.com/experiment/531185/analysis


In [22]:
#Optimization Loop
for _ in range(experiment.observation_budget):
    suggestion = conn.experiments(experiment.id).suggestions().create()
    assignments = suggestion.assignments
    value = evaluate(assignments, args)
 
    conn.experiments(experiment.id).observations().create(
        suggestion=suggestion.id,
        value=value
    )
    
    #update experiment object
    experiment = conn.experiments(experiment.id).fetch()
 
assignments = conn.experiments(experiment.id).best_assignments().fetch().data[0].assignments  
 
print("BEST ASSIGNMENTS FOUND: \n", assignments)

Params :  {'learning_rate': 0.005, 'reg': 0.0005, 'num_heads': 2, 'num_layers': 6, 'patch_size': 8}


  return F.mse_loss(input, target, reduction=self.reduction)


Epoch: [0][0/27046]	Time 0.033 (0.033)	Loss 0.3770 (0.3770)	
Epoch: [0][10/27046]	Time 0.018 (0.030)	Loss 2.2307 (4.9360)	
Epoch: [0][20/27046]	Time 0.019 (0.025)	Loss 0.3430 (3.2202)	
Epoch: [0][30/27046]	Time 0.019 (0.023)	Loss 0.3785 (2.4272)	
Epoch: [0][40/27046]	Time 0.019 (0.022)	Loss 0.2562 (1.8740)	
Epoch: [0][50/27046]	Time 0.019 (0.022)	Loss 0.2599 (1.5965)	
Epoch: [0][60/27046]	Time 0.021 (0.022)	Loss 0.7788 (1.4202)	
Epoch: [0][70/27046]	Time 0.019 (0.021)	Loss 0.1967 (1.2801)	
Epoch: [0][80/27046]	Time 0.018 (0.021)	Loss 0.9656 (1.1572)	
Epoch: [0][90/27046]	Time 0.019 (0.021)	Loss 0.6652 (1.0801)	
Epoch: [0][100/27046]	Time 0.019 (0.021)	Loss 0.2612 (0.9975)	
Epoch: [0][110/27046]	Time 0.019 (0.020)	Loss 0.9212 (0.9273)	
Epoch: [0][120/27046]	Time 0.018 (0.021)	Loss 0.1923 (0.8675)	
Epoch: [0][130/27046]	Time 0.019 (0.020)	Loss 0.0348 (0.8323)	
Epoch: [0][140/27046]	Time 0.019 (0.020)	Loss 0.0218 (0.7863)	
Epoch: [0][150/27046]	Time 0.018 (0.020)	Loss 0.2083 (0.7569)	
Epo

Epoch: [0][1300/27046]	Time 0.020 (0.020)	Loss 0.0591 (0.2566)	
Epoch: [0][1310/27046]	Time 0.024 (0.020)	Loss 0.2213 (0.2561)	
Epoch: [0][1320/27046]	Time 0.023 (0.020)	Loss 0.0104 (0.2551)	
Epoch: [0][1330/27046]	Time 0.021 (0.020)	Loss 0.0432 (0.2552)	
Epoch: [0][1340/27046]	Time 0.020 (0.020)	Loss 0.4126 (0.2544)	
Epoch: [0][1350/27046]	Time 0.023 (0.020)	Loss 0.0089 (0.2533)	
Epoch: [0][1360/27046]	Time 0.024 (0.020)	Loss 0.0655 (0.2523)	
Epoch: [0][1370/27046]	Time 0.019 (0.020)	Loss 0.0134 (0.2510)	
Epoch: [0][1380/27046]	Time 0.020 (0.020)	Loss 0.0074 (0.2507)	
Epoch: [0][1390/27046]	Time 0.023 (0.021)	Loss 0.0103 (0.2499)	
Epoch: [0][1400/27046]	Time 0.021 (0.021)	Loss 0.1372 (0.2490)	
Epoch: [0][1410/27046]	Time 0.023 (0.021)	Loss 0.0607 (0.2480)	
Epoch: [0][1420/27046]	Time 0.021 (0.021)	Loss 0.0266 (0.2470)	
Epoch: [0][1430/27046]	Time 0.022 (0.021)	Loss 0.0027 (0.2463)	
Epoch: [0][1440/27046]	Time 0.022 (0.021)	Loss 0.3532 (0.2455)	
Epoch: [0][1450/27046]	Time 0.020 (0.021

Epoch: [0][2590/27046]	Time 0.019 (0.020)	Loss 0.5101 (0.2048)	
Epoch: [0][2600/27046]	Time 0.020 (0.020)	Loss 0.0326 (0.2047)	
Epoch: [0][2610/27046]	Time 0.019 (0.020)	Loss 0.0138 (0.2045)	
Epoch: [0][2620/27046]	Time 0.021 (0.020)	Loss 0.0223 (0.2042)	
Epoch: [0][2630/27046]	Time 0.019 (0.020)	Loss 0.0119 (0.2044)	
Epoch: [0][2640/27046]	Time 0.021 (0.020)	Loss 0.2380 (0.2047)	
Epoch: [0][2650/27046]	Time 0.020 (0.020)	Loss 0.0995 (0.2041)	
Epoch: [0][2660/27046]	Time 0.021 (0.020)	Loss 0.0430 (0.2043)	
Epoch: [0][2670/27046]	Time 0.020 (0.020)	Loss 0.0008 (0.2037)	
Epoch: [0][2680/27046]	Time 0.019 (0.020)	Loss 0.0079 (0.2041)	
Epoch: [0][2690/27046]	Time 0.019 (0.020)	Loss 0.2293 (0.2037)	
Epoch: [0][2700/27046]	Time 0.020 (0.020)	Loss 0.5606 (0.2034)	
Epoch: [0][2710/27046]	Time 0.020 (0.020)	Loss 0.4069 (0.2033)	
Epoch: [0][2720/27046]	Time 0.019 (0.020)	Loss 0.0293 (0.2028)	
Epoch: [0][2730/27046]	Time 0.020 (0.020)	Loss 0.0376 (0.2024)	
Epoch: [0][2740/27046]	Time 0.019 (0.020

Epoch: [0][3890/27046]	Time 0.019 (0.020)	Loss 0.4053 (0.1896)	
Epoch: [0][3900/27046]	Time 0.019 (0.020)	Loss 0.2969 (0.1897)	
Epoch: [0][3910/27046]	Time 0.019 (0.020)	Loss 0.0259 (0.1896)	
Epoch: [0][3920/27046]	Time 0.019 (0.020)	Loss 0.0048 (0.1894)	
Epoch: [0][3930/27046]	Time 0.019 (0.020)	Loss 0.0131 (0.1891)	
Epoch: [0][3940/27046]	Time 0.019 (0.020)	Loss 0.3026 (0.1895)	
Epoch: [0][3950/27046]	Time 0.018 (0.020)	Loss 0.1575 (0.1896)	
Epoch: [0][3960/27046]	Time 0.019 (0.020)	Loss 0.0436 (0.1895)	
Epoch: [0][3970/27046]	Time 0.019 (0.020)	Loss 0.0746 (0.1892)	
Epoch: [0][3980/27046]	Time 0.021 (0.020)	Loss 0.0281 (0.1892)	
Epoch: [0][3990/27046]	Time 0.019 (0.020)	Loss 0.0338 (0.1890)	
Epoch: [0][4000/27046]	Time 0.020 (0.020)	Loss 0.0960 (0.1891)	
Epoch: [0][4010/27046]	Time 0.019 (0.020)	Loss 0.0114 (0.1889)	
Epoch: [0][4020/27046]	Time 0.019 (0.020)	Loss 0.1849 (0.1887)	
Epoch: [0][4030/27046]	Time 0.021 (0.020)	Loss 0.0332 (0.1885)	
Epoch: [0][4040/27046]	Time 0.020 (0.020

Epoch: [0][5190/27046]	Time 0.020 (0.020)	Loss 0.0885 (0.1841)	
Epoch: [0][5200/27046]	Time 0.019 (0.020)	Loss 0.0676 (0.1840)	
Epoch: [0][5210/27046]	Time 0.019 (0.020)	Loss 0.3675 (0.1840)	
Epoch: [0][5220/27046]	Time 0.020 (0.020)	Loss 0.0060 (0.1841)	
Epoch: [0][5230/27046]	Time 0.021 (0.020)	Loss 1.0357 (0.1841)	
Epoch: [0][5240/27046]	Time 0.021 (0.020)	Loss 0.0346 (0.1839)	
Epoch: [0][5250/27046]	Time 0.019 (0.020)	Loss 0.0200 (0.1837)	
Epoch: [0][5260/27046]	Time 0.019 (0.020)	Loss 0.7278 (0.1841)	
Epoch: [0][5270/27046]	Time 0.019 (0.020)	Loss 0.2660 (0.1840)	
Epoch: [0][5280/27046]	Time 0.019 (0.020)	Loss 0.0150 (0.1840)	
Epoch: [0][5290/27046]	Time 0.020 (0.020)	Loss 0.0533 (0.1841)	
Epoch: [0][5300/27046]	Time 0.020 (0.020)	Loss 0.0347 (0.1839)	
Epoch: [0][5310/27046]	Time 0.019 (0.020)	Loss 0.0326 (0.1842)	
Epoch: [0][5320/27046]	Time 0.019 (0.020)	Loss 0.0077 (0.1843)	
Epoch: [0][5330/27046]	Time 0.019 (0.020)	Loss 0.1043 (0.1843)	
Epoch: [0][5340/27046]	Time 0.020 (0.020

Epoch: [0][6490/27046]	Time 0.020 (0.020)	Loss 0.2134 (0.1822)	
Epoch: [0][6500/27046]	Time 0.020 (0.020)	Loss 0.0674 (0.1822)	
Epoch: [0][6510/27046]	Time 0.019 (0.020)	Loss 0.5120 (0.1823)	
Epoch: [0][6520/27046]	Time 0.019 (0.020)	Loss 0.0172 (0.1825)	
Epoch: [0][6530/27046]	Time 0.020 (0.020)	Loss 0.0517 (0.1823)	
Epoch: [0][6540/27046]	Time 0.020 (0.020)	Loss 0.0100 (0.1822)	
Epoch: [0][6550/27046]	Time 0.020 (0.020)	Loss 0.1141 (0.1824)	
Epoch: [0][6560/27046]	Time 0.020 (0.020)	Loss 0.0273 (0.1824)	
Epoch: [0][6570/27046]	Time 0.020 (0.020)	Loss 1.1141 (0.1825)	
Epoch: [0][6580/27046]	Time 0.020 (0.020)	Loss 0.0516 (0.1824)	
Epoch: [0][6590/27046]	Time 0.018 (0.020)	Loss 0.0116 (0.1823)	
Epoch: [0][6600/27046]	Time 0.020 (0.020)	Loss 0.1086 (0.1825)	
Epoch: [0][6610/27046]	Time 0.019 (0.020)	Loss 0.0447 (0.1825)	
Epoch: [0][6620/27046]	Time 0.021 (0.020)	Loss 0.0718 (0.1824)	
Epoch: [0][6630/27046]	Time 0.018 (0.020)	Loss 0.0308 (0.1825)	
Epoch: [0][6640/27046]	Time 0.047 (0.020

Epoch: [0][7780/27046]	Time 0.019 (0.020)	Loss 0.0057 (0.1780)	
Epoch: [0][7790/27046]	Time 0.019 (0.020)	Loss 0.0143 (0.1780)	
Epoch: [0][7800/27046]	Time 0.020 (0.020)	Loss 0.0021 (0.1779)	
Epoch: [0][7810/27046]	Time 0.021 (0.020)	Loss 0.0203 (0.1778)	
Epoch: [0][7820/27046]	Time 0.019 (0.020)	Loss 0.2537 (0.1779)	
Epoch: [0][7830/27046]	Time 0.022 (0.020)	Loss 0.0239 (0.1778)	
Epoch: [0][7840/27046]	Time 0.020 (0.020)	Loss 0.1508 (0.1778)	
Epoch: [0][7850/27046]	Time 0.019 (0.020)	Loss 0.0593 (0.1777)	
Epoch: [0][7860/27046]	Time 0.023 (0.020)	Loss 0.0023 (0.1778)	
Epoch: [0][7870/27046]	Time 0.019 (0.020)	Loss 0.1253 (0.1779)	
Epoch: [0][7880/27046]	Time 0.020 (0.020)	Loss 1.4372 (0.1781)	
Epoch: [0][7890/27046]	Time 0.020 (0.020)	Loss 0.0369 (0.1781)	
Epoch: [0][7900/27046]	Time 0.020 (0.020)	Loss 0.1589 (0.1780)	
Epoch: [0][7910/27046]	Time 0.020 (0.020)	Loss 0.0662 (0.1780)	
Epoch: [0][7920/27046]	Time 0.046 (0.020)	Loss 0.1353 (0.1779)	
Epoch: [0][7930/27046]	Time 0.020 (0.020

Epoch: [0][9070/27046]	Time 0.019 (0.020)	Loss 0.2537 (0.1764)	
Epoch: [0][9080/27046]	Time 0.023 (0.020)	Loss 0.0151 (0.1764)	
Epoch: [0][9090/27046]	Time 0.019 (0.020)	Loss 0.0697 (0.1763)	
Epoch: [0][9100/27046]	Time 0.019 (0.020)	Loss 0.0255 (0.1763)	
Epoch: [0][9110/27046]	Time 0.019 (0.020)	Loss 0.0316 (0.1764)	
Epoch: [0][9120/27046]	Time 0.019 (0.020)	Loss 0.0836 (0.1763)	
Epoch: [0][9130/27046]	Time 0.018 (0.020)	Loss 0.0133 (0.1763)	
Epoch: [0][9140/27046]	Time 0.019 (0.020)	Loss 0.3093 (0.1763)	
Epoch: [0][9150/27046]	Time 0.019 (0.020)	Loss 0.2186 (0.1762)	
Epoch: [0][9160/27046]	Time 0.020 (0.020)	Loss 0.0977 (0.1761)	
Epoch: [0][9170/27046]	Time 0.021 (0.020)	Loss 0.0051 (0.1762)	
Epoch: [0][9180/27046]	Time 0.019 (0.020)	Loss 0.0857 (0.1762)	
Epoch: [0][9190/27046]	Time 0.019 (0.020)	Loss 0.7661 (0.1765)	
Epoch: [0][9200/27046]	Time 0.045 (0.020)	Loss 0.3716 (0.1765)	
Epoch: [0][9210/27046]	Time 0.019 (0.020)	Loss 0.5651 (0.1767)	
Epoch: [0][9220/27046]	Time 0.019 (0.020

Epoch: [0][10360/27046]	Time 0.019 (0.020)	Loss 0.2004 (0.1747)	
Epoch: [0][10370/27046]	Time 0.019 (0.020)	Loss 0.1815 (0.1746)	
Epoch: [0][10380/27046]	Time 0.019 (0.020)	Loss 0.0217 (0.1745)	
Epoch: [0][10390/27046]	Time 0.019 (0.020)	Loss 0.0114 (0.1747)	
Epoch: [0][10400/27046]	Time 0.020 (0.020)	Loss 0.0675 (0.1747)	
Epoch: [0][10410/27046]	Time 0.019 (0.020)	Loss 0.1395 (0.1747)	
Epoch: [0][10420/27046]	Time 0.020 (0.020)	Loss 0.0656 (0.1747)	
Epoch: [0][10430/27046]	Time 0.019 (0.020)	Loss 0.0036 (0.1746)	
Epoch: [0][10440/27046]	Time 0.020 (0.020)	Loss 0.3118 (0.1746)	
Epoch: [0][10450/27046]	Time 0.019 (0.020)	Loss 0.5373 (0.1746)	
Epoch: [0][10460/27046]	Time 0.019 (0.020)	Loss 0.0726 (0.1745)	
Epoch: [0][10470/27046]	Time 0.019 (0.020)	Loss 0.1176 (0.1745)	
Epoch: [0][10480/27046]	Time 0.045 (0.020)	Loss 0.0973 (0.1745)	
Epoch: [0][10490/27046]	Time 0.020 (0.020)	Loss 0.3973 (0.1745)	
Epoch: [0][10500/27046]	Time 0.019 (0.020)	Loss 0.2096 (0.1744)	
Epoch: [0][10510/27046]	T

Epoch: [0][11630/27046]	Time 0.021 (0.020)	Loss 0.0022 (0.1755)	
Epoch: [0][11640/27046]	Time 0.021 (0.020)	Loss 0.0130 (0.1756)	
Epoch: [0][11650/27046]	Time 0.019 (0.020)	Loss 0.0345 (0.1755)	
Epoch: [0][11660/27046]	Time 0.019 (0.020)	Loss 0.0693 (0.1755)	
Epoch: [0][11670/27046]	Time 0.019 (0.020)	Loss 0.0518 (0.1756)	
Epoch: [0][11680/27046]	Time 0.020 (0.020)	Loss 0.0831 (0.1756)	
Epoch: [0][11690/27046]	Time 0.021 (0.020)	Loss 0.0362 (0.1755)	
Epoch: [0][11700/27046]	Time 0.019 (0.020)	Loss 0.0693 (0.1755)	
Epoch: [0][11710/27046]	Time 0.019 (0.020)	Loss 0.1350 (0.1755)	
Epoch: [0][11720/27046]	Time 0.019 (0.020)	Loss 0.2395 (0.1755)	
Epoch: [0][11730/27046]	Time 0.021 (0.020)	Loss 0.0383 (0.1754)	
Epoch: [0][11740/27046]	Time 0.019 (0.020)	Loss 0.1299 (0.1754)	
Epoch: [0][11750/27046]	Time 0.021 (0.020)	Loss 0.0667 (0.1755)	
Epoch: [0][11760/27046]	Time 0.044 (0.020)	Loss 0.5445 (0.1754)	
Epoch: [0][11770/27046]	Time 0.019 (0.020)	Loss 0.5096 (0.1754)	
Epoch: [0][11780/27046]	T

Epoch: [0][12910/27046]	Time 0.021 (0.020)	Loss 0.2621 (0.1733)	
Epoch: [0][12920/27046]	Time 0.024 (0.020)	Loss 0.0433 (0.1732)	
Epoch: [0][12930/27046]	Time 0.021 (0.020)	Loss 0.3293 (0.1732)	
Epoch: [0][12940/27046]	Time 0.021 (0.020)	Loss 0.2776 (0.1733)	
Epoch: [0][12950/27046]	Time 0.021 (0.020)	Loss 0.0165 (0.1733)	
Epoch: [0][12960/27046]	Time 0.022 (0.020)	Loss 0.1517 (0.1734)	
Epoch: [0][12970/27046]	Time 0.021 (0.020)	Loss 0.1832 (0.1735)	
Epoch: [0][12980/27046]	Time 0.019 (0.020)	Loss 0.0319 (0.1735)	
Epoch: [0][12990/27046]	Time 0.020 (0.020)	Loss 0.2308 (0.1734)	
Epoch: [0][13000/27046]	Time 0.020 (0.020)	Loss 0.1394 (0.1736)	
Epoch: [0][13010/27046]	Time 0.022 (0.020)	Loss 0.0319 (0.1736)	
Epoch: [0][13020/27046]	Time 0.020 (0.020)	Loss 0.0787 (0.1735)	
Epoch: [0][13030/27046]	Time 0.021 (0.020)	Loss 0.1407 (0.1735)	
Epoch: [0][13040/27046]	Time 0.048 (0.020)	Loss 0.0037 (0.1734)	
Epoch: [0][13050/27046]	Time 0.021 (0.020)	Loss 0.4579 (0.1735)	
Epoch: [0][13060/27046]	T

Epoch: [0][14180/27046]	Time 0.021 (0.020)	Loss 0.2646 (0.1724)	
Epoch: [0][14190/27046]	Time 0.022 (0.020)	Loss 0.1050 (0.1724)	
Epoch: [0][14200/27046]	Time 0.024 (0.020)	Loss 0.2079 (0.1724)	
Epoch: [0][14210/27046]	Time 0.019 (0.020)	Loss 0.0045 (0.1723)	
Epoch: [0][14220/27046]	Time 0.020 (0.020)	Loss 0.0645 (0.1723)	
Epoch: [0][14230/27046]	Time 0.019 (0.020)	Loss 0.1098 (0.1723)	
Epoch: [0][14240/27046]	Time 0.021 (0.020)	Loss 0.1035 (0.1722)	
Epoch: [0][14250/27046]	Time 0.021 (0.020)	Loss 0.1188 (0.1723)	
Epoch: [0][14260/27046]	Time 0.019 (0.020)	Loss 0.0261 (0.1722)	
Epoch: [0][14270/27046]	Time 0.020 (0.020)	Loss 0.0433 (0.1722)	
Epoch: [0][14280/27046]	Time 0.020 (0.020)	Loss 0.6128 (0.1722)	
Epoch: [0][14290/27046]	Time 0.020 (0.020)	Loss 0.0094 (0.1722)	
Epoch: [0][14300/27046]	Time 0.019 (0.020)	Loss 0.4800 (0.1721)	
Epoch: [0][14310/27046]	Time 0.019 (0.020)	Loss 0.1028 (0.1721)	
Epoch: [0][14320/27046]	Time 0.049 (0.020)	Loss 0.0271 (0.1721)	
Epoch: [0][14330/27046]	T

Epoch: [0][15460/27046]	Time 0.019 (0.020)	Loss 0.3576 (0.1713)	
Epoch: [0][15470/27046]	Time 0.019 (0.020)	Loss 0.0003 (0.1714)	
Epoch: [0][15480/27046]	Time 0.019 (0.020)	Loss 0.1180 (0.1714)	
Epoch: [0][15490/27046]	Time 0.019 (0.020)	Loss 0.0420 (0.1714)	
Epoch: [0][15500/27046]	Time 0.021 (0.020)	Loss 0.0143 (0.1713)	
Epoch: [0][15510/27046]	Time 0.022 (0.020)	Loss 0.0484 (0.1713)	
Epoch: [0][15520/27046]	Time 0.021 (0.020)	Loss 0.5767 (0.1712)	
Epoch: [0][15530/27046]	Time 0.019 (0.020)	Loss 0.2291 (0.1712)	
Epoch: [0][15540/27046]	Time 0.020 (0.020)	Loss 0.0344 (0.1712)	
Epoch: [0][15550/27046]	Time 0.022 (0.020)	Loss 0.0362 (0.1712)	
Epoch: [0][15560/27046]	Time 0.019 (0.020)	Loss 0.8193 (0.1712)	
Epoch: [0][15570/27046]	Time 0.020 (0.020)	Loss 0.6194 (0.1713)	
Epoch: [0][15580/27046]	Time 0.021 (0.020)	Loss 0.7206 (0.1714)	
Epoch: [0][15590/27046]	Time 0.020 (0.020)	Loss 0.0221 (0.1715)	
Epoch: [0][15600/27046]	Time 0.046 (0.020)	Loss 0.0784 (0.1714)	
Epoch: [0][15610/27046]	T

Epoch: [0][16730/27046]	Time 0.019 (0.020)	Loss 0.1155 (0.1705)	
Epoch: [0][16740/27046]	Time 0.022 (0.020)	Loss 0.0250 (0.1705)	
Epoch: [0][16750/27046]	Time 0.020 (0.020)	Loss 0.2483 (0.1705)	
Epoch: [0][16760/27046]	Time 0.020 (0.020)	Loss 0.1606 (0.1704)	
Epoch: [0][16770/27046]	Time 0.023 (0.020)	Loss 0.0246 (0.1704)	
Epoch: [0][16780/27046]	Time 0.024 (0.020)	Loss 0.0398 (0.1704)	
Epoch: [0][16790/27046]	Time 0.020 (0.020)	Loss 0.0761 (0.1704)	
Epoch: [0][16800/27046]	Time 0.019 (0.020)	Loss 0.0992 (0.1704)	
Epoch: [0][16810/27046]	Time 0.020 (0.020)	Loss 0.0485 (0.1704)	
Epoch: [0][16820/27046]	Time 0.022 (0.020)	Loss 0.6028 (0.1704)	
Epoch: [0][16830/27046]	Time 0.019 (0.020)	Loss 0.2491 (0.1703)	
Epoch: [0][16840/27046]	Time 0.021 (0.020)	Loss 0.0104 (0.1703)	
Epoch: [0][16850/27046]	Time 0.021 (0.020)	Loss 0.0140 (0.1703)	
Epoch: [0][16860/27046]	Time 0.020 (0.020)	Loss 0.1026 (0.1703)	
Epoch: [0][16870/27046]	Time 0.020 (0.020)	Loss 0.0796 (0.1703)	
Epoch: [0][16880/27046]	T

Epoch: [0][18010/27046]	Time 0.014 (0.020)	Loss 0.0337 (0.1704)	
Epoch: [0][18020/27046]	Time 0.021 (0.020)	Loss 0.1091 (0.1703)	
Epoch: [0][18030/27046]	Time 0.021 (0.020)	Loss 0.1193 (0.1703)	
Epoch: [0][18040/27046]	Time 0.020 (0.020)	Loss 0.1338 (0.1702)	
Epoch: [0][18050/27046]	Time 0.021 (0.020)	Loss 0.0642 (0.1702)	
Epoch: [0][18060/27046]	Time 0.029 (0.020)	Loss 0.0822 (0.1702)	
Epoch: [0][18070/27046]	Time 0.021 (0.020)	Loss 0.0343 (0.1702)	
Epoch: [0][18080/27046]	Time 0.022 (0.020)	Loss 0.0299 (0.1702)	
Epoch: [0][18090/27046]	Time 0.021 (0.020)	Loss 0.0100 (0.1702)	
Epoch: [0][18100/27046]	Time 0.022 (0.020)	Loss 0.5665 (0.1702)	
Epoch: [0][18110/27046]	Time 0.026 (0.020)	Loss 0.0017 (0.1702)	
Epoch: [0][18120/27046]	Time 0.025 (0.020)	Loss 0.0607 (0.1701)	
Epoch: [0][18130/27046]	Time 0.023 (0.020)	Loss 0.4430 (0.1701)	
Epoch: [0][18140/27046]	Time 0.022 (0.020)	Loss 0.0630 (0.1701)	
Epoch: [0][18150/27046]	Time 0.025 (0.020)	Loss 0.1221 (0.1701)	
Epoch: [0][18160/27046]	T

Epoch: [0][19280/27046]	Time 0.024 (0.020)	Loss 0.0095 (0.1691)	
Epoch: [0][19290/27046]	Time 0.021 (0.020)	Loss 0.0156 (0.1691)	
Epoch: [0][19300/27046]	Time 0.022 (0.020)	Loss 0.1094 (0.1691)	
Epoch: [0][19310/27046]	Time 0.020 (0.020)	Loss 0.0754 (0.1692)	
Epoch: [0][19320/27046]	Time 0.020 (0.020)	Loss 0.2327 (0.1692)	
Epoch: [0][19330/27046]	Time 0.020 (0.020)	Loss 0.1264 (0.1691)	
Epoch: [0][19340/27046]	Time 0.021 (0.020)	Loss 0.0127 (0.1691)	
Epoch: [0][19350/27046]	Time 0.023 (0.020)	Loss 0.2961 (0.1691)	
Epoch: [0][19360/27046]	Time 0.025 (0.020)	Loss 0.0067 (0.1690)	
Epoch: [0][19370/27046]	Time 0.021 (0.020)	Loss 0.1771 (0.1690)	
Epoch: [0][19380/27046]	Time 0.021 (0.020)	Loss 0.0099 (0.1690)	
Epoch: [0][19390/27046]	Time 0.023 (0.020)	Loss 0.4566 (0.1690)	
Epoch: [0][19400/27046]	Time 0.026 (0.020)	Loss 0.0428 (0.1689)	
Epoch: [0][19410/27046]	Time 0.020 (0.020)	Loss 0.0076 (0.1689)	
Epoch: [0][19420/27046]	Time 0.021 (0.020)	Loss 0.1106 (0.1689)	
Epoch: [0][19430/27046]	T

Epoch: [0][20560/27046]	Time 0.020 (0.020)	Loss 0.1772 (0.1683)	
Epoch: [0][20570/27046]	Time 0.022 (0.020)	Loss 0.1259 (0.1683)	
Epoch: [0][20580/27046]	Time 0.023 (0.020)	Loss 0.0281 (0.1683)	
Epoch: [0][20590/27046]	Time 0.020 (0.020)	Loss 0.3425 (0.1683)	
Epoch: [0][20600/27046]	Time 0.020 (0.020)	Loss 0.0038 (0.1682)	
Epoch: [0][20610/27046]	Time 0.023 (0.020)	Loss 0.2283 (0.1682)	
Epoch: [0][20620/27046]	Time 0.020 (0.020)	Loss 0.0620 (0.1682)	
Epoch: [0][20630/27046]	Time 0.022 (0.020)	Loss 0.3521 (0.1682)	
Epoch: [0][20640/27046]	Time 0.025 (0.020)	Loss 0.4897 (0.1681)	
Epoch: [0][20650/27046]	Time 0.020 (0.020)	Loss 0.4674 (0.1682)	
Epoch: [0][20660/27046]	Time 0.020 (0.020)	Loss 0.0329 (0.1682)	
Epoch: [0][20670/27046]	Time 0.024 (0.020)	Loss 0.0161 (0.1682)	
Epoch: [0][20680/27046]	Time 0.022 (0.020)	Loss 0.6561 (0.1682)	
Epoch: [0][20690/27046]	Time 0.020 (0.020)	Loss 0.0456 (0.1681)	
Epoch: [0][20700/27046]	Time 0.021 (0.020)	Loss 0.0455 (0.1682)	
Epoch: [0][20710/27046]	T

Epoch: [0][21830/27046]	Time 0.020 (0.020)	Loss 0.0767 (0.1674)	
Epoch: [0][21840/27046]	Time 0.025 (0.020)	Loss 0.0968 (0.1674)	
Epoch: [0][21850/27046]	Time 0.020 (0.020)	Loss 0.3403 (0.1674)	
Epoch: [0][21860/27046]	Time 0.021 (0.020)	Loss 0.0084 (0.1674)	
Epoch: [0][21870/27046]	Time 0.024 (0.020)	Loss 0.6281 (0.1674)	
Epoch: [0][21880/27046]	Time 0.023 (0.020)	Loss 0.0603 (0.1674)	
Epoch: [0][21890/27046]	Time 0.020 (0.020)	Loss 0.0172 (0.1674)	
Epoch: [0][21900/27046]	Time 0.022 (0.020)	Loss 0.0131 (0.1674)	
Epoch: [0][21910/27046]	Time 0.019 (0.020)	Loss 0.0604 (0.1674)	
Epoch: [0][21920/27046]	Time 0.022 (0.020)	Loss 0.0038 (0.1673)	
Epoch: [0][21930/27046]	Time 0.021 (0.020)	Loss 0.0279 (0.1673)	
Epoch: [0][21940/27046]	Time 0.020 (0.020)	Loss 0.2062 (0.1673)	
Epoch: [0][21950/27046]	Time 0.023 (0.020)	Loss 1.3162 (0.1673)	
Epoch: [0][21960/27046]	Time 0.021 (0.020)	Loss 0.1455 (0.1673)	
Epoch: [0][21970/27046]	Time 0.020 (0.020)	Loss 0.0210 (0.1673)	
Epoch: [0][21980/27046]	T

Epoch: [0][23110/27046]	Time 0.020 (0.020)	Loss 0.0058 (0.1680)	
Epoch: [0][23120/27046]	Time 0.019 (0.020)	Loss 0.0132 (0.1680)	
Epoch: [0][23130/27046]	Time 0.020 (0.020)	Loss 0.0071 (0.1680)	
Epoch: [0][23140/27046]	Time 0.020 (0.020)	Loss 0.2757 (0.1680)	
Epoch: [0][23150/27046]	Time 0.020 (0.020)	Loss 0.0793 (0.1680)	
Epoch: [0][23160/27046]	Time 0.020 (0.020)	Loss 0.0311 (0.1680)	
Epoch: [0][23170/27046]	Time 0.021 (0.020)	Loss 0.0491 (0.1680)	
Epoch: [0][23180/27046]	Time 0.021 (0.020)	Loss 0.0179 (0.1680)	
Epoch: [0][23190/27046]	Time 0.022 (0.020)	Loss 0.1372 (0.1680)	
Epoch: [0][23200/27046]	Time 0.020 (0.020)	Loss 0.0367 (0.1680)	
Epoch: [0][23210/27046]	Time 0.020 (0.020)	Loss 0.0138 (0.1679)	
Epoch: [0][23220/27046]	Time 0.024 (0.020)	Loss 0.0093 (0.1679)	
Epoch: [0][23230/27046]	Time 0.020 (0.020)	Loss 0.0229 (0.1679)	
Epoch: [0][23240/27046]	Time 0.020 (0.020)	Loss 0.4109 (0.1679)	
Epoch: [0][23250/27046]	Time 0.020 (0.020)	Loss 0.0331 (0.1678)	
Epoch: [0][23260/27046]	T

Epoch: [0][24390/27046]	Time 0.019 (0.020)	Loss 0.0030 (0.1680)	
Epoch: [0][24400/27046]	Time 0.019 (0.020)	Loss 0.1260 (0.1680)	
Epoch: [0][24410/27046]	Time 0.020 (0.020)	Loss 0.0103 (0.1680)	
Epoch: [0][24420/27046]	Time 0.024 (0.020)	Loss 0.0342 (0.1679)	
Epoch: [0][24430/27046]	Time 0.019 (0.020)	Loss 0.2048 (0.1679)	
Epoch: [0][24440/27046]	Time 0.021 (0.020)	Loss 0.2048 (0.1680)	
Epoch: [0][24450/27046]	Time 0.021 (0.020)	Loss 0.0541 (0.1679)	
Epoch: [0][24460/27046]	Time 0.019 (0.020)	Loss 0.4077 (0.1679)	
Epoch: [0][24470/27046]	Time 0.019 (0.020)	Loss 0.2101 (0.1679)	
Epoch: [0][24480/27046]	Time 0.020 (0.020)	Loss 0.6303 (0.1680)	
Epoch: [0][24490/27046]	Time 0.021 (0.020)	Loss 0.0292 (0.1680)	
Epoch: [0][24500/27046]	Time 0.020 (0.020)	Loss 1.6355 (0.1680)	
Epoch: [0][24510/27046]	Time 0.020 (0.020)	Loss 0.0571 (0.1679)	
Epoch: [0][24520/27046]	Time 0.020 (0.020)	Loss 0.0321 (0.1679)	
Epoch: [0][24530/27046]	Time 0.019 (0.020)	Loss 0.3997 (0.1679)	
Epoch: [0][24540/27046]	T

Epoch: [0][25670/27046]	Time 0.020 (0.020)	Loss 0.2228 (0.1678)	
Epoch: [0][25680/27046]	Time 0.021 (0.020)	Loss 0.0181 (0.1678)	
Epoch: [0][25690/27046]	Time 0.019 (0.020)	Loss 0.0837 (0.1678)	
Epoch: [0][25700/27046]	Time 0.019 (0.020)	Loss 0.0980 (0.1678)	
Epoch: [0][25710/27046]	Time 0.021 (0.020)	Loss 0.2043 (0.1678)	
Epoch: [0][25720/27046]	Time 0.022 (0.020)	Loss 0.0266 (0.1677)	
Epoch: [0][25730/27046]	Time 0.020 (0.020)	Loss 0.0471 (0.1677)	
Epoch: [0][25740/27046]	Time 0.019 (0.020)	Loss 0.3010 (0.1677)	
Epoch: [0][25750/27046]	Time 0.022 (0.020)	Loss 0.3567 (0.1677)	
Epoch: [0][25760/27046]	Time 0.025 (0.020)	Loss 0.9019 (0.1677)	
Epoch: [0][25770/27046]	Time 0.025 (0.020)	Loss 0.0582 (0.1678)	
Epoch: [0][25780/27046]	Time 0.020 (0.020)	Loss 0.0083 (0.1677)	
Epoch: [0][25790/27046]	Time 0.022 (0.020)	Loss 1.0216 (0.1678)	
Epoch: [0][25800/27046]	Time 0.023 (0.020)	Loss 0.4200 (0.1678)	
Epoch: [0][25810/27046]	Time 0.020 (0.020)	Loss 0.0004 (0.1678)	
Epoch: [0][25820/27046]	T

Epoch: [0][26950/27046]	Time 0.020 (0.021)	Loss 0.4921 (0.1677)	
Epoch: [0][26960/27046]	Time 0.020 (0.021)	Loss 0.1077 (0.1677)	
Epoch: [0][26970/27046]	Time 0.022 (0.021)	Loss 0.1394 (0.1677)	
Epoch: [0][26980/27046]	Time 0.022 (0.021)	Loss 0.0346 (0.1677)	
Epoch: [0][26990/27046]	Time 0.021 (0.021)	Loss 0.3897 (0.1677)	
Epoch: [0][27000/27046]	Time 0.021 (0.021)	Loss 0.0039 (0.1676)	
Epoch: [0][27010/27046]	Time 0.023 (0.021)	Loss 0.4465 (0.1676)	
Epoch: [0][27020/27046]	Time 0.023 (0.021)	Loss 0.0503 (0.1676)	
Epoch: [0][27030/27046]	Time 0.022 (0.021)	Loss 0.0152 (0.1676)	
Epoch: [0][27040/27046]	Time 0.020 (0.021)	Loss 0.0350 (0.1676)	
Average training loss this epoch: 0.1676
Epoch: [0][0/6762]	Time 0.005 (0.005)	
Epoch: [0][10/6762]	Time 0.005 (0.004)	
Epoch: [0][20/6762]	Time 0.004 (0.004)	
Epoch: [0][30/6762]	Time 0.004 (0.004)	
Epoch: [0][40/6762]	Time 0.004 (0.004)	
Epoch: [0][50/6762]	Time 0.004 (0.004)	
Epoch: [0][60/6762]	Time 0.005 (0.004)	
Epoch: [0][70/6762]	Time 0.004

Epoch: [0][1830/6762]	Time 0.004 (0.004)	
Epoch: [0][1840/6762]	Time 0.004 (0.004)	
Epoch: [0][1850/6762]	Time 0.004 (0.004)	
Epoch: [0][1860/6762]	Time 0.004 (0.004)	
Epoch: [0][1870/6762]	Time 0.006 (0.004)	
Epoch: [0][1880/6762]	Time 0.004 (0.004)	
Epoch: [0][1890/6762]	Time 0.004 (0.004)	
Epoch: [0][1900/6762]	Time 0.004 (0.004)	
Epoch: [0][1910/6762]	Time 0.004 (0.004)	
Epoch: [0][1920/6762]	Time 0.004 (0.004)	
Epoch: [0][1930/6762]	Time 0.006 (0.004)	
Epoch: [0][1940/6762]	Time 0.005 (0.004)	
Epoch: [0][1950/6762]	Time 0.004 (0.004)	
Epoch: [0][1960/6762]	Time 0.004 (0.004)	
Epoch: [0][1970/6762]	Time 0.004 (0.004)	
Epoch: [0][1980/6762]	Time 0.004 (0.004)	
Epoch: [0][1990/6762]	Time 0.006 (0.004)	
Epoch: [0][2000/6762]	Time 0.005 (0.004)	
Epoch: [0][2010/6762]	Time 0.005 (0.004)	
Epoch: [0][2020/6762]	Time 0.004 (0.004)	
Epoch: [0][2030/6762]	Time 0.006 (0.004)	
Epoch: [0][2040/6762]	Time 0.003 (0.004)	
Epoch: [0][2050/6762]	Time 0.004 (0.004)	
Epoch: [0][2060/6762]	Time 0.004 (

Epoch: [0][3820/6762]	Time 0.004 (0.005)	
Epoch: [0][3830/6762]	Time 0.004 (0.005)	
Epoch: [0][3840/6762]	Time 0.005 (0.005)	
Epoch: [0][3850/6762]	Time 0.004 (0.005)	
Epoch: [0][3860/6762]	Time 0.004 (0.005)	
Epoch: [0][3870/6762]	Time 0.004 (0.005)	
Epoch: [0][3880/6762]	Time 0.003 (0.005)	
Epoch: [0][3890/6762]	Time 0.003 (0.005)	
Epoch: [0][3900/6762]	Time 0.007 (0.005)	
Epoch: [0][3910/6762]	Time 0.004 (0.005)	
Epoch: [0][3920/6762]	Time 0.004 (0.005)	
Epoch: [0][3930/6762]	Time 0.003 (0.005)	
Epoch: [0][3940/6762]	Time 0.005 (0.005)	
Epoch: [0][3950/6762]	Time 0.004 (0.005)	
Epoch: [0][3960/6762]	Time 0.004 (0.005)	
Epoch: [0][3970/6762]	Time 0.004 (0.005)	
Epoch: [0][3980/6762]	Time 0.004 (0.005)	
Epoch: [0][3990/6762]	Time 0.003 (0.004)	
Epoch: [0][4000/6762]	Time 0.005 (0.004)	
Epoch: [0][4010/6762]	Time 0.005 (0.004)	
Epoch: [0][4020/6762]	Time 0.003 (0.004)	
Epoch: [0][4030/6762]	Time 0.004 (0.004)	
Epoch: [0][4040/6762]	Time 0.004 (0.004)	
Epoch: [0][4050/6762]	Time 0.004 (

Epoch: [0][5800/6762]	Time 0.004 (0.004)	
Epoch: [0][5810/6762]	Time 0.004 (0.004)	
Epoch: [0][5820/6762]	Time 0.005 (0.004)	
Epoch: [0][5830/6762]	Time 0.004 (0.004)	
Epoch: [0][5840/6762]	Time 0.004 (0.004)	
Epoch: [0][5850/6762]	Time 0.004 (0.004)	
Epoch: [0][5860/6762]	Time 0.003 (0.004)	
Epoch: [0][5870/6762]	Time 0.003 (0.004)	
Epoch: [0][5880/6762]	Time 0.004 (0.004)	
Epoch: [0][5890/6762]	Time 0.007 (0.004)	
Epoch: [0][5900/6762]	Time 0.004 (0.004)	
Epoch: [0][5910/6762]	Time 0.004 (0.004)	
Epoch: [0][5920/6762]	Time 0.004 (0.004)	
Epoch: [0][5930/6762]	Time 0.005 (0.004)	
Epoch: [0][5940/6762]	Time 0.004 (0.004)	
Epoch: [0][5950/6762]	Time 0.005 (0.004)	
Epoch: [0][5960/6762]	Time 0.004 (0.004)	
Epoch: [0][5970/6762]	Time 0.005 (0.004)	
Epoch: [0][5980/6762]	Time 0.004 (0.004)	
Epoch: [0][5990/6762]	Time 0.004 (0.004)	
Epoch: [0][6000/6762]	Time 0.004 (0.004)	
Epoch: [0][6010/6762]	Time 0.007 (0.004)	
Epoch: [0][6020/6762]	Time 0.003 (0.004)	
Epoch: [0][6030/6762]	Time 0.004 (

Epoch: [1][660/27046]	Time 0.023 (0.022)	Loss 0.1532 (0.1807)	
Epoch: [1][670/27046]	Time 0.025 (0.022)	Loss 0.1001 (0.1801)	
Epoch: [1][680/27046]	Time 0.020 (0.022)	Loss 0.0802 (0.1795)	
Epoch: [1][690/27046]	Time 0.021 (0.022)	Loss 0.1588 (0.1795)	
Epoch: [1][700/27046]	Time 0.025 (0.022)	Loss 0.5721 (0.1800)	
Epoch: [1][710/27046]	Time 0.024 (0.022)	Loss 0.0186 (0.1821)	
Epoch: [1][720/27046]	Time 0.021 (0.022)	Loss 0.0072 (0.1812)	
Epoch: [1][730/27046]	Time 0.021 (0.022)	Loss 0.6717 (0.1823)	
Epoch: [1][740/27046]	Time 0.022 (0.022)	Loss 0.3694 (0.1813)	
Epoch: [1][750/27046]	Time 0.021 (0.022)	Loss 0.2223 (0.1830)	
Epoch: [1][760/27046]	Time 0.020 (0.022)	Loss 0.0798 (0.1828)	
Epoch: [1][770/27046]	Time 0.026 (0.022)	Loss 0.0599 (0.1831)	
Epoch: [1][780/27046]	Time 0.023 (0.022)	Loss 0.0136 (0.1817)	
Epoch: [1][790/27046]	Time 0.023 (0.022)	Loss 0.1006 (0.1809)	
Epoch: [1][800/27046]	Time 0.050 (0.022)	Loss 0.0136 (0.1796)	
Epoch: [1][810/27046]	Time 0.021 (0.022)	Loss 0.1925 (0

Epoch: [1][1960/27046]	Time 0.020 (0.022)	Loss 0.0385 (0.1698)	
Epoch: [1][1970/27046]	Time 0.024 (0.022)	Loss 0.0720 (0.1696)	
Epoch: [1][1980/27046]	Time 0.020 (0.022)	Loss 0.0024 (0.1700)	
Epoch: [1][1990/27046]	Time 0.020 (0.022)	Loss 0.0299 (0.1701)	
Epoch: [1][2000/27046]	Time 0.020 (0.022)	Loss 0.0718 (0.1698)	
Epoch: [1][2010/27046]	Time 0.021 (0.022)	Loss 0.0517 (0.1694)	
Epoch: [1][2020/27046]	Time 0.020 (0.022)	Loss 0.8187 (0.1698)	
Epoch: [1][2030/27046]	Time 0.022 (0.022)	Loss 0.1356 (0.1697)	
Epoch: [1][2040/27046]	Time 0.023 (0.022)	Loss 0.0436 (0.1694)	
Epoch: [1][2050/27046]	Time 0.024 (0.022)	Loss 0.0583 (0.1690)	
Epoch: [1][2060/27046]	Time 0.020 (0.022)	Loss 0.5614 (0.1690)	
Epoch: [1][2070/27046]	Time 0.021 (0.022)	Loss 0.6157 (0.1692)	
Epoch: [1][2080/27046]	Time 0.056 (0.022)	Loss 0.0603 (0.1692)	
Epoch: [1][2090/27046]	Time 0.022 (0.022)	Loss 0.1082 (0.1690)	
Epoch: [1][2100/27046]	Time 0.025 (0.022)	Loss 0.0538 (0.1690)	
Epoch: [1][2110/27046]	Time 0.023 (0.022

Epoch: [1][3250/27046]	Time 0.023 (0.022)	Loss 0.1310 (0.1677)	
Epoch: [1][3260/27046]	Time 0.021 (0.022)	Loss 0.1285 (0.1678)	
Epoch: [1][3270/27046]	Time 0.021 (0.022)	Loss 0.1072 (0.1681)	
Epoch: [1][3280/27046]	Time 0.020 (0.022)	Loss 0.0663 (0.1679)	
Epoch: [1][3290/27046]	Time 0.026 (0.022)	Loss 0.0297 (0.1678)	
Epoch: [1][3300/27046]	Time 0.020 (0.022)	Loss 0.1378 (0.1680)	
Epoch: [1][3310/27046]	Time 0.036 (0.022)	Loss 0.1499 (0.1679)	
Epoch: [1][3320/27046]	Time 0.025 (0.022)	Loss 0.0701 (0.1683)	
Epoch: [1][3330/27046]	Time 0.020 (0.022)	Loss 0.0539 (0.1682)	
Epoch: [1][3340/27046]	Time 0.024 (0.022)	Loss 0.0152 (0.1682)	
Epoch: [1][3350/27046]	Time 0.020 (0.022)	Loss 0.0343 (0.1679)	
Epoch: [1][3360/27046]	Time 0.046 (0.022)	Loss 0.0694 (0.1685)	
Epoch: [1][3370/27046]	Time 0.021 (0.022)	Loss 0.2627 (0.1685)	
Epoch: [1][3380/27046]	Time 0.022 (0.022)	Loss 0.0088 (0.1687)	
Epoch: [1][3390/27046]	Time 0.022 (0.022)	Loss 0.0923 (0.1689)	
Epoch: [1][3400/27046]	Time 0.026 (0.022

Epoch: [1][4540/27046]	Time 0.022 (0.022)	Loss 0.0954 (0.1657)	
Epoch: [1][4550/27046]	Time 0.021 (0.022)	Loss 0.0178 (0.1655)	
Epoch: [1][4560/27046]	Time 0.020 (0.022)	Loss 0.2602 (0.1654)	
Epoch: [1][4570/27046]	Time 0.024 (0.022)	Loss 0.6807 (0.1653)	
Epoch: [1][4580/27046]	Time 0.021 (0.022)	Loss 0.1044 (0.1651)	
Epoch: [1][4590/27046]	Time 0.021 (0.022)	Loss 0.4633 (0.1651)	
Epoch: [1][4600/27046]	Time 0.021 (0.022)	Loss 0.0442 (0.1651)	
Epoch: [1][4610/27046]	Time 0.021 (0.022)	Loss 0.1139 (0.1651)	
Epoch: [1][4620/27046]	Time 0.019 (0.022)	Loss 0.0293 (0.1648)	
Epoch: [1][4630/27046]	Time 0.023 (0.022)	Loss 0.0069 (0.1646)	
Epoch: [1][4640/27046]	Time 0.047 (0.022)	Loss 0.1025 (0.1647)	
Epoch: [1][4650/27046]	Time 0.020 (0.022)	Loss 0.0142 (0.1648)	
Epoch: [1][4660/27046]	Time 0.021 (0.022)	Loss 0.0086 (0.1649)	
Epoch: [1][4670/27046]	Time 0.023 (0.022)	Loss 0.0122 (0.1648)	
Epoch: [1][4680/27046]	Time 0.024 (0.022)	Loss 0.1059 (0.1647)	
Epoch: [1][4690/27046]	Time 0.023 (0.022

Epoch: [1][5830/27046]	Time 0.024 (0.022)	Loss 0.0349 (0.1646)	
Epoch: [1][5840/27046]	Time 0.020 (0.022)	Loss 0.2419 (0.1648)	
Epoch: [1][5850/27046]	Time 0.021 (0.022)	Loss 0.0121 (0.1646)	
Epoch: [1][5860/27046]	Time 0.025 (0.022)	Loss 0.0198 (0.1647)	
Epoch: [1][5870/27046]	Time 0.025 (0.022)	Loss 0.0706 (0.1646)	
Epoch: [1][5880/27046]	Time 0.023 (0.022)	Loss 0.0026 (0.1644)	
Epoch: [1][5890/27046]	Time 0.024 (0.022)	Loss 0.0272 (0.1644)	
Epoch: [1][5900/27046]	Time 0.024 (0.022)	Loss 0.0295 (0.1644)	
Epoch: [1][5910/27046]	Time 0.024 (0.022)	Loss 0.1766 (0.1644)	
Epoch: [1][5920/27046]	Time 0.048 (0.022)	Loss 0.0325 (0.1644)	
Epoch: [1][5930/27046]	Time 0.024 (0.022)	Loss 0.9044 (0.1645)	
Epoch: [1][5940/27046]	Time 0.024 (0.022)	Loss 0.0439 (0.1646)	
Epoch: [1][5950/27046]	Time 0.023 (0.022)	Loss 0.1217 (0.1645)	
Epoch: [1][5960/27046]	Time 0.022 (0.022)	Loss 0.1285 (0.1648)	
Epoch: [1][5970/27046]	Time 0.022 (0.022)	Loss 0.0148 (0.1650)	
Epoch: [1][5980/27046]	Time 0.025 (0.022

Epoch: [1][7130/27046]	Time 0.022 (0.022)	Loss 0.0160 (0.1685)	
Epoch: [1][7140/27046]	Time 0.022 (0.022)	Loss 0.0979 (0.1684)	
Epoch: [1][7150/27046]	Time 0.019 (0.022)	Loss 0.0370 (0.1684)	
Epoch: [1][7160/27046]	Time 0.019 (0.022)	Loss 0.0452 (0.1683)	
Epoch: [1][7170/27046]	Time 0.020 (0.022)	Loss 0.0334 (0.1681)	
Epoch: [1][7180/27046]	Time 0.020 (0.022)	Loss 0.0134 (0.1680)	
Epoch: [1][7190/27046]	Time 0.023 (0.022)	Loss 0.0716 (0.1680)	
Epoch: [1][7200/27046]	Time 0.046 (0.022)	Loss 0.0705 (0.1678)	
Epoch: [1][7210/27046]	Time 0.023 (0.022)	Loss 0.0174 (0.1679)	
Epoch: [1][7220/27046]	Time 0.020 (0.022)	Loss 0.0689 (0.1678)	
Epoch: [1][7230/27046]	Time 0.022 (0.022)	Loss 0.0149 (0.1677)	
Epoch: [1][7240/27046]	Time 0.020 (0.022)	Loss 0.0701 (0.1678)	
Epoch: [1][7250/27046]	Time 0.022 (0.022)	Loss 0.0276 (0.1677)	
Epoch: [1][7260/27046]	Time 0.023 (0.022)	Loss 0.0331 (0.1676)	
Epoch: [1][7270/27046]	Time 0.022 (0.022)	Loss 0.0254 (0.1675)	
Epoch: [1][7280/27046]	Time 0.022 (0.022

Epoch: [1][8420/27046]	Time 0.022 (0.022)	Loss 0.0164 (0.1645)	
Epoch: [1][8430/27046]	Time 0.024 (0.022)	Loss 0.0170 (0.1644)	
Epoch: [1][8440/27046]	Time 0.024 (0.022)	Loss 0.1002 (0.1644)	
Epoch: [1][8450/27046]	Time 0.024 (0.022)	Loss 0.0020 (0.1643)	
Epoch: [1][8460/27046]	Time 0.022 (0.022)	Loss 0.3812 (0.1643)	
Epoch: [1][8470/27046]	Time 0.025 (0.022)	Loss 0.3975 (0.1645)	
Epoch: [1][8480/27046]	Time 0.048 (0.022)	Loss 0.0142 (0.1644)	
Epoch: [1][8490/27046]	Time 0.024 (0.022)	Loss 0.0682 (0.1644)	
Epoch: [1][8500/27046]	Time 0.023 (0.022)	Loss 0.6316 (0.1644)	
Epoch: [1][8510/27046]	Time 0.024 (0.022)	Loss 0.0352 (0.1644)	
Epoch: [1][8520/27046]	Time 0.024 (0.022)	Loss 0.1193 (0.1643)	
Epoch: [1][8530/27046]	Time 0.024 (0.022)	Loss 0.0766 (0.1645)	
Epoch: [1][8540/27046]	Time 0.022 (0.022)	Loss 0.2874 (0.1646)	
Epoch: [1][8550/27046]	Time 0.020 (0.022)	Loss 0.2948 (0.1647)	
Epoch: [1][8560/27046]	Time 0.022 (0.022)	Loss 0.0147 (0.1647)	
Epoch: [1][8570/27046]	Time 0.021 (0.022

Epoch: [1][9710/27046]	Time 0.023 (0.022)	Loss 0.0018 (0.1653)	
Epoch: [1][9720/27046]	Time 0.021 (0.022)	Loss 0.0215 (0.1652)	
Epoch: [1][9730/27046]	Time 0.020 (0.022)	Loss 0.5727 (0.1653)	
Epoch: [1][9740/27046]	Time 0.022 (0.022)	Loss 0.0471 (0.1653)	
Epoch: [1][9750/27046]	Time 0.022 (0.022)	Loss 0.0023 (0.1652)	
Epoch: [1][9760/27046]	Time 0.044 (0.022)	Loss 0.1934 (0.1651)	
Epoch: [1][9770/27046]	Time 0.024 (0.022)	Loss 0.0360 (0.1653)	
Epoch: [1][9780/27046]	Time 0.024 (0.022)	Loss 0.3840 (0.1653)	
Epoch: [1][9790/27046]	Time 0.021 (0.022)	Loss 0.2688 (0.1656)	
Epoch: [1][9800/27046]	Time 0.020 (0.022)	Loss 1.0392 (0.1656)	
Epoch: [1][9810/27046]	Time 0.020 (0.022)	Loss 0.1250 (0.1655)	
Epoch: [1][9820/27046]	Time 0.021 (0.022)	Loss 0.2556 (0.1654)	
Epoch: [1][9830/27046]	Time 0.022 (0.022)	Loss 0.4586 (0.1654)	
Epoch: [1][9840/27046]	Time 0.022 (0.022)	Loss 0.0392 (0.1653)	
Epoch: [1][9850/27046]	Time 0.024 (0.022)	Loss 0.0091 (0.1652)	
Epoch: [1][9860/27046]	Time 0.019 (0.022

Epoch: [1][10980/27046]	Time 0.023 (0.022)	Loss 0.0150 (0.1651)	
Epoch: [1][10990/27046]	Time 0.026 (0.022)	Loss 0.5007 (0.1651)	
Epoch: [1][11000/27046]	Time 0.023 (0.022)	Loss 0.1437 (0.1652)	
Epoch: [1][11010/27046]	Time 0.023 (0.022)	Loss 0.5794 (0.1653)	
Epoch: [1][11020/27046]	Time 0.024 (0.022)	Loss 0.2754 (0.1653)	
Epoch: [1][11030/27046]	Time 0.025 (0.022)	Loss 0.1901 (0.1654)	
Epoch: [1][11040/27046]	Time 0.049 (0.022)	Loss 0.0610 (0.1654)	
Epoch: [1][11050/27046]	Time 0.023 (0.022)	Loss 0.0586 (0.1655)	
Epoch: [1][11060/27046]	Time 0.021 (0.022)	Loss 0.0949 (0.1655)	
Epoch: [1][11070/27046]	Time 0.027 (0.022)	Loss 0.2082 (0.1656)	
Epoch: [1][11080/27046]	Time 0.022 (0.022)	Loss 0.5026 (0.1655)	
Epoch: [1][11090/27046]	Time 0.023 (0.022)	Loss 0.0537 (0.1655)	
Epoch: [1][11100/27046]	Time 0.024 (0.022)	Loss 0.7440 (0.1655)	
Epoch: [1][11110/27046]	Time 0.024 (0.022)	Loss 0.0861 (0.1655)	
Epoch: [1][11120/27046]	Time 0.020 (0.022)	Loss 0.1698 (0.1655)	
Epoch: [1][11130/27046]	T

Epoch: [1][12260/27046]	Time 0.021 (0.022)	Loss 0.0411 (0.1642)	
Epoch: [1][12270/27046]	Time 0.020 (0.022)	Loss 0.1151 (0.1642)	
Epoch: [1][12280/27046]	Time 0.019 (0.022)	Loss 0.0600 (0.1641)	
Epoch: [1][12290/27046]	Time 0.022 (0.022)	Loss 0.2330 (0.1641)	
Epoch: [1][12300/27046]	Time 0.020 (0.022)	Loss 0.0589 (0.1641)	
Epoch: [1][12310/27046]	Time 0.020 (0.022)	Loss 0.0597 (0.1641)	
Epoch: [1][12320/27046]	Time 0.045 (0.022)	Loss 0.0014 (0.1640)	
Epoch: [1][12330/27046]	Time 0.020 (0.022)	Loss 0.0668 (0.1640)	
Epoch: [1][12340/27046]	Time 0.022 (0.022)	Loss 0.0116 (0.1641)	
Epoch: [1][12350/27046]	Time 0.020 (0.022)	Loss 0.0270 (0.1641)	
Epoch: [1][12360/27046]	Time 0.020 (0.022)	Loss 0.0134 (0.1640)	
Epoch: [1][12370/27046]	Time 0.019 (0.022)	Loss 1.7119 (0.1641)	
Epoch: [1][12380/27046]	Time 0.019 (0.022)	Loss 0.4869 (0.1641)	
Epoch: [1][12390/27046]	Time 0.022 (0.022)	Loss 0.1067 (0.1641)	
Epoch: [1][12400/27046]	Time 0.020 (0.022)	Loss 0.0186 (0.1641)	
Epoch: [1][12410/27046]	T

Epoch: [1][13530/27046]	Time 0.023 (0.022)	Loss 0.0283 (0.1647)	
Epoch: [1][13540/27046]	Time 0.020 (0.022)	Loss 0.1825 (0.1647)	
Epoch: [1][13550/27046]	Time 0.020 (0.022)	Loss 0.2284 (0.1646)	
Epoch: [1][13560/27046]	Time 0.021 (0.022)	Loss 0.0945 (0.1647)	
Epoch: [1][13570/27046]	Time 0.020 (0.022)	Loss 0.1067 (0.1647)	
Epoch: [1][13580/27046]	Time 0.020 (0.022)	Loss 0.0243 (0.1646)	
Epoch: [1][13590/27046]	Time 0.020 (0.022)	Loss 0.0721 (0.1646)	
Epoch: [1][13600/27046]	Time 0.044 (0.022)	Loss 0.1321 (0.1646)	
Epoch: [1][13610/27046]	Time 0.025 (0.022)	Loss 0.3516 (0.1645)	
Epoch: [1][13620/27046]	Time 0.021 (0.022)	Loss 0.1468 (0.1645)	
Epoch: [1][13630/27046]	Time 0.020 (0.022)	Loss 0.3874 (0.1645)	
Epoch: [1][13640/27046]	Time 0.023 (0.022)	Loss 0.1584 (0.1645)	
Epoch: [1][13650/27046]	Time 0.021 (0.022)	Loss 0.0740 (0.1644)	
Epoch: [1][13660/27046]	Time 0.021 (0.022)	Loss 0.3979 (0.1644)	
Epoch: [1][13670/27046]	Time 0.021 (0.022)	Loss 0.0096 (0.1644)	
Epoch: [1][13680/27046]	T

Epoch: [1][14800/27046]	Time 0.020 (0.022)	Loss 0.0380 (0.1633)	
Epoch: [1][14810/27046]	Time 0.020 (0.022)	Loss 0.1156 (0.1633)	
Epoch: [1][14820/27046]	Time 0.020 (0.022)	Loss 0.4881 (0.1634)	
Epoch: [1][14830/27046]	Time 0.022 (0.022)	Loss 0.0163 (0.1633)	
Epoch: [1][14840/27046]	Time 0.019 (0.022)	Loss 0.1932 (0.1633)	
Epoch: [1][14850/27046]	Time 0.020 (0.022)	Loss 0.0150 (0.1633)	
Epoch: [1][14860/27046]	Time 0.020 (0.022)	Loss 0.1265 (0.1632)	
Epoch: [1][14870/27046]	Time 0.023 (0.022)	Loss 0.3200 (0.1633)	
Epoch: [1][14880/27046]	Time 0.044 (0.022)	Loss 0.0216 (0.1633)	
Epoch: [1][14890/27046]	Time 0.021 (0.022)	Loss 0.0023 (0.1633)	
Epoch: [1][14900/27046]	Time 0.019 (0.022)	Loss 0.0012 (0.1634)	
Epoch: [1][14910/27046]	Time 0.020 (0.022)	Loss 0.0077 (0.1635)	
Epoch: [1][14920/27046]	Time 0.021 (0.022)	Loss 0.0306 (0.1634)	
Epoch: [1][14930/27046]	Time 0.020 (0.022)	Loss 0.1031 (0.1636)	
Epoch: [1][14940/27046]	Time 0.019 (0.022)	Loss 0.3316 (0.1636)	
Epoch: [1][14950/27046]	T

Epoch: [1][16070/27046]	Time 0.021 (0.022)	Loss 0.4066 (0.1634)	
Epoch: [1][16080/27046]	Time 0.023 (0.022)	Loss 0.0948 (0.1635)	
Epoch: [1][16090/27046]	Time 0.024 (0.022)	Loss 0.7826 (0.1636)	
Epoch: [1][16100/27046]	Time 0.021 (0.022)	Loss 0.2143 (0.1637)	
Epoch: [1][16110/27046]	Time 0.022 (0.022)	Loss 0.1767 (0.1636)	
Epoch: [1][16120/27046]	Time 0.025 (0.022)	Loss 0.3448 (0.1636)	
Epoch: [1][16130/27046]	Time 0.021 (0.022)	Loss 0.0586 (0.1636)	
Epoch: [1][16140/27046]	Time 0.021 (0.022)	Loss 0.0179 (0.1636)	
Epoch: [1][16150/27046]	Time 0.024 (0.022)	Loss 0.0145 (0.1636)	
Epoch: [1][16160/27046]	Time 0.045 (0.022)	Loss 0.0386 (0.1635)	
Epoch: [1][16170/27046]	Time 0.020 (0.022)	Loss 0.1156 (0.1635)	
Epoch: [1][16180/27046]	Time 0.021 (0.022)	Loss 0.0047 (0.1635)	
Epoch: [1][16190/27046]	Time 0.022 (0.022)	Loss 0.1466 (0.1634)	
Epoch: [1][16200/27046]	Time 0.025 (0.022)	Loss 0.0317 (0.1634)	
Epoch: [1][16210/27046]	Time 0.021 (0.022)	Loss 0.4769 (0.1634)	
Epoch: [1][16220/27046]	T

Epoch: [1][17340/27046]	Time 0.021 (0.022)	Loss 0.0118 (0.1630)	
Epoch: [1][17350/27046]	Time 0.019 (0.022)	Loss 0.0696 (0.1630)	
Epoch: [1][17360/27046]	Time 0.021 (0.022)	Loss 0.0310 (0.1630)	
Epoch: [1][17370/27046]	Time 0.020 (0.022)	Loss 0.0147 (0.1630)	
Epoch: [1][17380/27046]	Time 0.020 (0.022)	Loss 0.2993 (0.1630)	
Epoch: [1][17390/27046]	Time 0.024 (0.022)	Loss 0.1961 (0.1629)	
Epoch: [1][17400/27046]	Time 0.021 (0.022)	Loss 0.2087 (0.1630)	
Epoch: [1][17410/27046]	Time 0.020 (0.022)	Loss 0.2506 (0.1630)	
Epoch: [1][17420/27046]	Time 0.020 (0.022)	Loss 0.1054 (0.1629)	
Epoch: [1][17430/27046]	Time 0.026 (0.022)	Loss 0.0035 (0.1629)	
Epoch: [1][17440/27046]	Time 0.046 (0.022)	Loss 1.0736 (0.1630)	
Epoch: [1][17450/27046]	Time 0.020 (0.022)	Loss 0.3628 (0.1630)	
Epoch: [1][17460/27046]	Time 0.020 (0.022)	Loss 0.2482 (0.1631)	
Epoch: [1][17470/27046]	Time 0.022 (0.022)	Loss 0.0275 (0.1631)	
Epoch: [1][17480/27046]	Time 0.023 (0.022)	Loss 0.1007 (0.1630)	
Epoch: [1][17490/27046]	T

Epoch: [1][18620/27046]	Time 0.019 (0.022)	Loss 0.1877 (0.1631)	
Epoch: [1][18630/27046]	Time 0.021 (0.022)	Loss 0.1193 (0.1631)	
Epoch: [1][18640/27046]	Time 0.020 (0.022)	Loss 0.0508 (0.1631)	
Epoch: [1][18650/27046]	Time 0.020 (0.022)	Loss 0.1060 (0.1630)	
Epoch: [1][18660/27046]	Time 0.021 (0.022)	Loss 0.1326 (0.1630)	
Epoch: [1][18670/27046]	Time 0.023 (0.022)	Loss 0.6776 (0.1630)	
Epoch: [1][18680/27046]	Time 0.019 (0.022)	Loss 0.1070 (0.1630)	
Epoch: [1][18690/27046]	Time 0.021 (0.022)	Loss 0.4615 (0.1630)	
Epoch: [1][18700/27046]	Time 0.019 (0.022)	Loss 0.0495 (0.1630)	
Epoch: [1][18710/27046]	Time 0.019 (0.022)	Loss 0.2873 (0.1631)	
Epoch: [1][18720/27046]	Time 0.044 (0.022)	Loss 0.0106 (0.1630)	
Epoch: [1][18730/27046]	Time 0.019 (0.022)	Loss 1.3927 (0.1631)	
Epoch: [1][18740/27046]	Time 0.019 (0.022)	Loss 0.1741 (0.1631)	
Epoch: [1][18750/27046]	Time 0.026 (0.022)	Loss 0.0068 (0.1631)	
Epoch: [1][18760/27046]	Time 0.023 (0.022)	Loss 0.0369 (0.1630)	
Epoch: [1][18770/27046]	T

Epoch: [1][19890/27046]	Time 0.024 (0.022)	Loss 0.2428 (0.1632)	
Epoch: [1][19900/27046]	Time 0.023 (0.022)	Loss 0.0166 (0.1632)	
Epoch: [1][19910/27046]	Time 0.022 (0.022)	Loss 0.3185 (0.1632)	
Epoch: [1][19920/27046]	Time 0.019 (0.022)	Loss 0.4190 (0.1632)	
Epoch: [1][19930/27046]	Time 0.023 (0.022)	Loss 0.2346 (0.1632)	
Epoch: [1][19940/27046]	Time 0.023 (0.022)	Loss 0.0646 (0.1632)	
Epoch: [1][19950/27046]	Time 0.020 (0.022)	Loss 0.6729 (0.1632)	
Epoch: [1][19960/27046]	Time 0.020 (0.022)	Loss 0.1427 (0.1632)	
Epoch: [1][19970/27046]	Time 0.022 (0.022)	Loss 0.3639 (0.1632)	
Epoch: [1][19980/27046]	Time 0.023 (0.022)	Loss 0.1742 (0.1632)	
Epoch: [1][19990/27046]	Time 0.021 (0.022)	Loss 0.3627 (0.1632)	
Epoch: [1][20000/27046]	Time 0.041 (0.022)	Loss 0.1054 (0.1632)	
Epoch: [1][20010/27046]	Time 0.022 (0.022)	Loss 0.0543 (0.1632)	
Epoch: [1][20020/27046]	Time 0.020 (0.022)	Loss 0.0477 (0.1631)	
Epoch: [1][20030/27046]	Time 0.020 (0.022)	Loss 0.1088 (0.1632)	
Epoch: [1][20040/27046]	T

Epoch: [1][21160/27046]	Time 0.020 (0.022)	Loss 0.0711 (0.1631)	
Epoch: [1][21170/27046]	Time 0.020 (0.022)	Loss 0.1252 (0.1631)	
Epoch: [1][21180/27046]	Time 0.021 (0.022)	Loss 0.1968 (0.1632)	
Epoch: [1][21190/27046]	Time 0.021 (0.022)	Loss 0.0949 (0.1632)	
Epoch: [1][21200/27046]	Time 0.022 (0.022)	Loss 0.0057 (0.1631)	
Epoch: [1][21210/27046]	Time 0.023 (0.022)	Loss 0.2811 (0.1631)	
Epoch: [1][21220/27046]	Time 0.020 (0.022)	Loss 0.0219 (0.1631)	
Epoch: [1][21230/27046]	Time 0.020 (0.022)	Loss 0.1724 (0.1632)	
Epoch: [1][21240/27046]	Time 0.022 (0.022)	Loss 0.7737 (0.1632)	
Epoch: [1][21250/27046]	Time 0.021 (0.022)	Loss 0.0814 (0.1632)	
Epoch: [1][21260/27046]	Time 0.019 (0.022)	Loss 1.1228 (0.1632)	
Epoch: [1][21270/27046]	Time 0.023 (0.022)	Loss 0.0335 (0.1632)	
Epoch: [1][21280/27046]	Time 0.042 (0.022)	Loss 0.0908 (0.1632)	
Epoch: [1][21290/27046]	Time 0.024 (0.022)	Loss 0.0871 (0.1631)	
Epoch: [1][21300/27046]	Time 0.020 (0.022)	Loss 0.0158 (0.1631)	
Epoch: [1][21310/27046]	T

Epoch: [1][22440/27046]	Time 0.023 (0.021)	Loss 0.3104 (0.1633)	
Epoch: [1][22450/27046]	Time 0.024 (0.021)	Loss 0.0036 (0.1633)	
Epoch: [1][22460/27046]	Time 0.020 (0.021)	Loss 0.2360 (0.1633)	
Epoch: [1][22470/27046]	Time 0.021 (0.021)	Loss 0.1057 (0.1633)	
Epoch: [1][22480/27046]	Time 0.022 (0.021)	Loss 0.2258 (0.1633)	
Epoch: [1][22490/27046]	Time 0.020 (0.021)	Loss 0.1490 (0.1633)	
Epoch: [1][22500/27046]	Time 0.019 (0.021)	Loss 0.0007 (0.1634)	
Epoch: [1][22510/27046]	Time 0.020 (0.021)	Loss 0.0681 (0.1634)	
Epoch: [1][22520/27046]	Time 0.020 (0.021)	Loss 0.1207 (0.1634)	
Epoch: [1][22530/27046]	Time 0.022 (0.021)	Loss 0.0372 (0.1634)	
Epoch: [1][22540/27046]	Time 0.020 (0.021)	Loss 0.4722 (0.1634)	
Epoch: [1][22550/27046]	Time 0.020 (0.021)	Loss 0.3604 (0.1633)	
Epoch: [1][22560/27046]	Time 0.043 (0.021)	Loss 0.3708 (0.1634)	
Epoch: [1][22570/27046]	Time 0.024 (0.021)	Loss 0.2005 (0.1634)	
Epoch: [1][22580/27046]	Time 0.019 (0.021)	Loss 0.3672 (0.1633)	
Epoch: [1][22590/27046]	T

Epoch: [1][23710/27046]	Time 0.021 (0.021)	Loss 0.0884 (0.1638)	
Epoch: [1][23720/27046]	Time 0.021 (0.021)	Loss 0.0547 (0.1638)	
Epoch: [1][23730/27046]	Time 0.020 (0.021)	Loss 0.2311 (0.1638)	
Epoch: [1][23740/27046]	Time 0.018 (0.021)	Loss 0.2614 (0.1638)	
Epoch: [1][23750/27046]	Time 0.020 (0.021)	Loss 1.1934 (0.1639)	
Epoch: [1][23760/27046]	Time 0.021 (0.021)	Loss 0.0488 (0.1639)	
Epoch: [1][23770/27046]	Time 0.020 (0.021)	Loss 0.1458 (0.1639)	
Epoch: [1][23780/27046]	Time 0.019 (0.021)	Loss 0.0474 (0.1639)	
Epoch: [1][23790/27046]	Time 0.020 (0.021)	Loss 0.0290 (0.1638)	
Epoch: [1][23800/27046]	Time 0.020 (0.021)	Loss 0.0541 (0.1638)	
Epoch: [1][23810/27046]	Time 0.020 (0.021)	Loss 0.0734 (0.1638)	
Epoch: [1][23820/27046]	Time 0.020 (0.021)	Loss 0.0152 (0.1638)	
Epoch: [1][23830/27046]	Time 0.020 (0.021)	Loss 0.2275 (0.1638)	
Epoch: [1][23840/27046]	Time 0.041 (0.021)	Loss 0.4470 (0.1638)	
Epoch: [1][23850/27046]	Time 0.022 (0.021)	Loss 0.0988 (0.1638)	
Epoch: [1][23860/27046]	T

Epoch: [1][24980/27046]	Time 0.029 (0.021)	Loss 0.0933 (0.1635)	
Epoch: [1][24990/27046]	Time 0.020 (0.021)	Loss 0.0859 (0.1635)	
Epoch: [1][25000/27046]	Time 0.019 (0.021)	Loss 0.0430 (0.1635)	
Epoch: [1][25010/27046]	Time 0.021 (0.021)	Loss 0.4163 (0.1635)	
Epoch: [1][25020/27046]	Time 0.022 (0.021)	Loss 0.0244 (0.1635)	
Epoch: [1][25030/27046]	Time 0.019 (0.021)	Loss 0.0712 (0.1635)	
Epoch: [1][25040/27046]	Time 0.019 (0.021)	Loss 0.4120 (0.1635)	
Epoch: [1][25050/27046]	Time 0.022 (0.021)	Loss 0.0022 (0.1635)	
Epoch: [1][25060/27046]	Time 0.023 (0.021)	Loss 0.0026 (0.1635)	
Epoch: [1][25070/27046]	Time 0.022 (0.021)	Loss 0.0029 (0.1635)	
Epoch: [1][25080/27046]	Time 0.019 (0.021)	Loss 0.3034 (0.1635)	
Epoch: [1][25090/27046]	Time 0.022 (0.021)	Loss 0.2046 (0.1635)	
Epoch: [1][25100/27046]	Time 0.021 (0.021)	Loss 0.0311 (0.1636)	
Epoch: [1][25110/27046]	Time 0.020 (0.021)	Loss 0.1957 (0.1636)	
Epoch: [1][25120/27046]	Time 0.039 (0.021)	Loss 0.0320 (0.1636)	
Epoch: [1][25130/27046]	T

Epoch: [1][26250/27046]	Time 0.020 (0.021)	Loss 0.0485 (0.1634)	
Epoch: [1][26260/27046]	Time 0.021 (0.021)	Loss 0.1645 (0.1634)	
Epoch: [1][26270/27046]	Time 0.020 (0.021)	Loss 0.0044 (0.1634)	
Epoch: [1][26280/27046]	Time 0.020 (0.021)	Loss 0.4226 (0.1634)	
Epoch: [1][26290/27046]	Time 0.024 (0.021)	Loss 0.2776 (0.1635)	
Epoch: [1][26300/27046]	Time 0.019 (0.021)	Loss 0.0627 (0.1635)	
Epoch: [1][26310/27046]	Time 0.019 (0.021)	Loss 0.4787 (0.1635)	
Epoch: [1][26320/27046]	Time 0.022 (0.021)	Loss 0.2950 (0.1635)	
Epoch: [1][26330/27046]	Time 0.019 (0.021)	Loss 0.0799 (0.1635)	
Epoch: [1][26340/27046]	Time 0.022 (0.021)	Loss 0.0043 (0.1635)	
Epoch: [1][26350/27046]	Time 0.021 (0.021)	Loss 0.0135 (0.1635)	
Epoch: [1][26360/27046]	Time 0.019 (0.021)	Loss 0.0600 (0.1635)	
Epoch: [1][26370/27046]	Time 0.021 (0.021)	Loss 0.0604 (0.1635)	
Epoch: [1][26380/27046]	Time 0.021 (0.021)	Loss 0.2405 (0.1635)	
Epoch: [1][26390/27046]	Time 0.023 (0.021)	Loss 0.0300 (0.1635)	
Epoch: [1][26400/27046]	T

Epoch: [1][740/6762]	Time 0.005 (0.004)	
Epoch: [1][750/6762]	Time 0.005 (0.004)	
Epoch: [1][760/6762]	Time 0.004 (0.004)	
Epoch: [1][770/6762]	Time 0.004 (0.004)	
Epoch: [1][780/6762]	Time 0.004 (0.004)	
Epoch: [1][790/6762]	Time 0.003 (0.004)	
Epoch: [1][800/6762]	Time 0.004 (0.004)	
Epoch: [1][810/6762]	Time 0.004 (0.004)	
Epoch: [1][820/6762]	Time 0.005 (0.004)	
Epoch: [1][830/6762]	Time 0.005 (0.004)	
Epoch: [1][840/6762]	Time 0.005 (0.004)	
Epoch: [1][850/6762]	Time 0.005 (0.004)	
Epoch: [1][860/6762]	Time 0.004 (0.004)	
Epoch: [1][870/6762]	Time 0.005 (0.004)	
Epoch: [1][880/6762]	Time 0.005 (0.004)	
Epoch: [1][890/6762]	Time 0.004 (0.004)	
Epoch: [1][900/6762]	Time 0.005 (0.004)	
Epoch: [1][910/6762]	Time 0.004 (0.004)	
Epoch: [1][920/6762]	Time 0.005 (0.004)	
Epoch: [1][930/6762]	Time 0.005 (0.004)	
Epoch: [1][940/6762]	Time 0.004 (0.004)	
Epoch: [1][950/6762]	Time 0.004 (0.004)	
Epoch: [1][960/6762]	Time 0.005 (0.004)	
Epoch: [1][970/6762]	Time 0.004 (0.004)	
Epoch: [1][980/6

Epoch: [1][2700/6762]	Time 0.005 (0.004)	
Epoch: [1][2710/6762]	Time 0.005 (0.004)	
Epoch: [1][2720/6762]	Time 0.005 (0.004)	
Epoch: [1][2730/6762]	Time 0.005 (0.004)	
Epoch: [1][2740/6762]	Time 0.005 (0.004)	
Epoch: [1][2750/6762]	Time 0.004 (0.004)	
Epoch: [1][2760/6762]	Time 0.005 (0.004)	
Epoch: [1][2770/6762]	Time 0.004 (0.004)	
Epoch: [1][2780/6762]	Time 0.004 (0.004)	
Epoch: [1][2790/6762]	Time 0.004 (0.004)	
Epoch: [1][2800/6762]	Time 0.004 (0.004)	
Epoch: [1][2810/6762]	Time 0.004 (0.004)	
Epoch: [1][2820/6762]	Time 0.004 (0.004)	
Epoch: [1][2830/6762]	Time 0.006 (0.004)	
Epoch: [1][2840/6762]	Time 0.004 (0.004)	
Epoch: [1][2850/6762]	Time 0.004 (0.004)	
Epoch: [1][2860/6762]	Time 0.004 (0.004)	
Epoch: [1][2870/6762]	Time 0.005 (0.004)	
Epoch: [1][2880/6762]	Time 0.005 (0.004)	
Epoch: [1][2890/6762]	Time 0.005 (0.004)	
Epoch: [1][2900/6762]	Time 0.004 (0.004)	
Epoch: [1][2910/6762]	Time 0.005 (0.004)	
Epoch: [1][2920/6762]	Time 0.004 (0.004)	
Epoch: [1][2930/6762]	Time 0.004 (

Epoch: [1][4680/6762]	Time 0.005 (0.004)	
Epoch: [1][4690/6762]	Time 0.006 (0.004)	
Epoch: [1][4700/6762]	Time 0.004 (0.004)	
Epoch: [1][4710/6762]	Time 0.005 (0.004)	
Epoch: [1][4720/6762]	Time 0.004 (0.004)	
Epoch: [1][4730/6762]	Time 0.004 (0.004)	
Epoch: [1][4740/6762]	Time 0.004 (0.004)	
Epoch: [1][4750/6762]	Time 0.004 (0.004)	
Epoch: [1][4760/6762]	Time 0.004 (0.004)	
Epoch: [1][4770/6762]	Time 0.004 (0.004)	
Epoch: [1][4780/6762]	Time 0.004 (0.004)	
Epoch: [1][4790/6762]	Time 0.004 (0.004)	
Epoch: [1][4800/6762]	Time 0.004 (0.004)	
Epoch: [1][4810/6762]	Time 0.005 (0.004)	
Epoch: [1][4820/6762]	Time 0.004 (0.004)	
Epoch: [1][4830/6762]	Time 0.004 (0.004)	
Epoch: [1][4840/6762]	Time 0.003 (0.004)	
Epoch: [1][4850/6762]	Time 0.004 (0.004)	
Epoch: [1][4860/6762]	Time 0.005 (0.004)	
Epoch: [1][4870/6762]	Time 0.004 (0.004)	
Epoch: [1][4880/6762]	Time 0.004 (0.004)	
Epoch: [1][4890/6762]	Time 0.004 (0.004)	
Epoch: [1][4900/6762]	Time 0.005 (0.004)	
Epoch: [1][4910/6762]	Time 0.004 (

Epoch: [1][6660/6762]	Time 0.004 (0.004)	
Epoch: [1][6670/6762]	Time 0.004 (0.004)	
Epoch: [1][6680/6762]	Time 0.004 (0.004)	
Epoch: [1][6690/6762]	Time 0.004 (0.004)	
Epoch: [1][6700/6762]	Time 0.005 (0.004)	
Epoch: [1][6710/6762]	Time 0.004 (0.004)	
Epoch: [1][6720/6762]	Time 0.005 (0.004)	
Epoch: [1][6730/6762]	Time 0.004 (0.004)	
Epoch: [1][6740/6762]	Time 0.004 (0.004)	
Epoch: [1][6750/6762]	Time 0.004 (0.004)	
Epoch: [1][6760/6762]	Time 0.004 (0.004)	
* Average Loss @1: 0.1677
Epoch: [2][0/27046]	Time 0.021 (0.021)	Loss 0.0443 (0.0443)	
Epoch: [2][10/27046]	Time 0.022 (0.020)	Loss 0.0068 (0.0745)	
Epoch: [2][20/27046]	Time 0.019 (0.021)	Loss 0.2237 (0.0824)	
Epoch: [2][30/27046]	Time 0.020 (0.020)	Loss 0.0001 (0.1138)	
Epoch: [2][40/27046]	Time 0.021 (0.020)	Loss 0.6522 (0.1555)	
Epoch: [2][50/27046]	Time 0.020 (0.020)	Loss 0.0114 (0.1682)	
Epoch: [2][60/27046]	Time 0.021 (0.020)	Loss 0.0115 (0.1480)	
Epoch: [2][70/27046]	Time 0.020 (0.020)	Loss 1.0085 (0.1618)	
Epoch: [2][80/270

Epoch: [2][1240/27046]	Time 0.021 (0.021)	Loss 0.0161 (0.1701)	
Epoch: [2][1250/27046]	Time 0.020 (0.021)	Loss 0.1806 (0.1697)	
Epoch: [2][1260/27046]	Time 0.020 (0.021)	Loss 0.0042 (0.1692)	
Epoch: [2][1270/27046]	Time 0.023 (0.021)	Loss 0.0242 (0.1688)	
Epoch: [2][1280/27046]	Time 0.021 (0.021)	Loss 0.0927 (0.1686)	
Epoch: [2][1290/27046]	Time 0.020 (0.021)	Loss 0.0640 (0.1687)	
Epoch: [2][1300/27046]	Time 0.019 (0.021)	Loss 0.0580 (0.1690)	
Epoch: [2][1310/27046]	Time 0.019 (0.021)	Loss 0.0680 (0.1681)	
Epoch: [2][1320/27046]	Time 0.020 (0.021)	Loss 0.0020 (0.1674)	
Epoch: [2][1330/27046]	Time 0.021 (0.021)	Loss 0.1030 (0.1675)	
Epoch: [2][1340/27046]	Time 0.021 (0.021)	Loss 0.0088 (0.1678)	
Epoch: [2][1350/27046]	Time 0.021 (0.021)	Loss 0.0018 (0.1674)	
Epoch: [2][1360/27046]	Time 0.037 (0.021)	Loss 0.3198 (0.1673)	
Epoch: [2][1370/27046]	Time 0.020 (0.021)	Loss 0.0242 (0.1680)	
Epoch: [2][1380/27046]	Time 0.020 (0.021)	Loss 0.0338 (0.1674)	
Epoch: [2][1390/27046]	Time 0.020 (0.021

Epoch: [2][2530/27046]	Time 0.023 (0.021)	Loss 0.2747 (0.1700)	
Epoch: [2][2540/27046]	Time 0.021 (0.021)	Loss 0.0664 (0.1695)	
Epoch: [2][2550/27046]	Time 0.025 (0.021)	Loss 0.3927 (0.1696)	
Epoch: [2][2560/27046]	Time 0.021 (0.021)	Loss 0.0082 (0.1694)	
Epoch: [2][2570/27046]	Time 0.025 (0.021)	Loss 0.8288 (0.1693)	
Epoch: [2][2580/27046]	Time 0.024 (0.021)	Loss 0.0578 (0.1696)	
Epoch: [2][2590/27046]	Time 0.025 (0.021)	Loss 0.0417 (0.1696)	
Epoch: [2][2600/27046]	Time 0.021 (0.021)	Loss 0.0965 (0.1695)	
Epoch: [2][2610/27046]	Time 0.024 (0.021)	Loss 0.3757 (0.1694)	
Epoch: [2][2620/27046]	Time 0.024 (0.021)	Loss 0.0176 (0.1693)	
Epoch: [2][2630/27046]	Time 0.027 (0.021)	Loss 0.0113 (0.1691)	
Epoch: [2][2640/27046]	Time 0.043 (0.021)	Loss 0.0864 (0.1686)	
Epoch: [2][2650/27046]	Time 0.024 (0.021)	Loss 0.0257 (0.1686)	
Epoch: [2][2660/27046]	Time 0.023 (0.021)	Loss 0.0363 (0.1686)	
Epoch: [2][2670/27046]	Time 0.025 (0.021)	Loss 0.0517 (0.1685)	
Epoch: [2][2680/27046]	Time 0.023 (0.021

Epoch: [2][3820/27046]	Time 0.022 (0.021)	Loss 0.0658 (0.1629)	
Epoch: [2][3830/27046]	Time 0.026 (0.021)	Loss 0.0260 (0.1635)	
Epoch: [2][3840/27046]	Time 0.025 (0.021)	Loss 0.1052 (0.1633)	
Epoch: [2][3850/27046]	Time 0.025 (0.021)	Loss 0.2615 (0.1632)	
Epoch: [2][3860/27046]	Time 0.019 (0.021)	Loss 0.0392 (0.1633)	
Epoch: [2][3870/27046]	Time 0.025 (0.021)	Loss 0.0052 (0.1634)	
Epoch: [2][3880/27046]	Time 0.022 (0.021)	Loss 0.0426 (0.1632)	
Epoch: [2][3890/27046]	Time 0.024 (0.021)	Loss 0.1449 (0.1633)	
Epoch: [2][3900/27046]	Time 0.021 (0.021)	Loss 0.1804 (0.1632)	
Epoch: [2][3910/27046]	Time 0.025 (0.021)	Loss 0.0434 (0.1631)	
Epoch: [2][3920/27046]	Time 0.046 (0.021)	Loss 0.2850 (0.1637)	
Epoch: [2][3930/27046]	Time 0.024 (0.021)	Loss 0.0199 (0.1637)	
Epoch: [2][3940/27046]	Time 0.021 (0.021)	Loss 0.2171 (0.1635)	
Epoch: [2][3950/27046]	Time 0.023 (0.021)	Loss 0.0016 (0.1634)	
Epoch: [2][3960/27046]	Time 0.021 (0.021)	Loss 0.2063 (0.1637)	
Epoch: [2][3970/27046]	Time 0.022 (0.021

Epoch: [2][5110/27046]	Time 0.024 (0.022)	Loss 0.0221 (0.1662)	
Epoch: [2][5120/27046]	Time 0.022 (0.022)	Loss 0.0030 (0.1660)	
Epoch: [2][5130/27046]	Time 0.022 (0.022)	Loss 0.1735 (0.1660)	
Epoch: [2][5140/27046]	Time 0.024 (0.022)	Loss 0.0463 (0.1662)	
Epoch: [2][5150/27046]	Time 0.027 (0.022)	Loss 0.1897 (0.1663)	
Epoch: [2][5160/27046]	Time 0.022 (0.022)	Loss 0.4177 (0.1663)	
Epoch: [2][5170/27046]	Time 0.030 (0.022)	Loss 0.0578 (0.1663)	
Epoch: [2][5180/27046]	Time 0.024 (0.022)	Loss 0.0570 (0.1664)	
Epoch: [2][5190/27046]	Time 0.027 (0.022)	Loss 0.9483 (0.1665)	
Epoch: [2][5200/27046]	Time 0.046 (0.022)	Loss 0.0200 (0.1664)	
Epoch: [2][5210/27046]	Time 0.026 (0.022)	Loss 0.0581 (0.1664)	
Epoch: [2][5220/27046]	Time 0.024 (0.022)	Loss 0.1693 (0.1664)	
Epoch: [2][5230/27046]	Time 0.023 (0.022)	Loss 0.1254 (0.1664)	
Epoch: [2][5240/27046]	Time 0.024 (0.022)	Loss 0.0111 (0.1662)	
Epoch: [2][5250/27046]	Time 0.027 (0.022)	Loss 0.0844 (0.1662)	
Epoch: [2][5260/27046]	Time 0.022 (0.022

Epoch: [2][6400/27046]	Time 0.022 (0.022)	Loss 0.0317 (0.1639)	
Epoch: [2][6410/27046]	Time 0.026 (0.022)	Loss 0.0583 (0.1642)	
Epoch: [2][6420/27046]	Time 0.022 (0.022)	Loss 0.2166 (0.1642)	
Epoch: [2][6430/27046]	Time 0.027 (0.022)	Loss 0.2730 (0.1643)	
Epoch: [2][6440/27046]	Time 0.028 (0.022)	Loss 0.0414 (0.1643)	
Epoch: [2][6450/27046]	Time 0.032 (0.022)	Loss 0.0197 (0.1642)	
Epoch: [2][6460/27046]	Time 0.026 (0.022)	Loss 0.0225 (0.1640)	
Epoch: [2][6470/27046]	Time 0.026 (0.022)	Loss 0.0531 (0.1639)	
Epoch: [2][6480/27046]	Time 0.043 (0.022)	Loss 0.0045 (0.1638)	
Epoch: [2][6490/27046]	Time 0.022 (0.022)	Loss 0.1346 (0.1638)	
Epoch: [2][6500/27046]	Time 0.027 (0.022)	Loss 0.0437 (0.1637)	
Epoch: [2][6510/27046]	Time 0.025 (0.022)	Loss 0.1972 (0.1637)	
Epoch: [2][6520/27046]	Time 0.025 (0.022)	Loss 0.3105 (0.1636)	
Epoch: [2][6530/27046]	Time 0.027 (0.022)	Loss 0.4097 (0.1637)	
Epoch: [2][6540/27046]	Time 0.023 (0.022)	Loss 0.0252 (0.1636)	
Epoch: [2][6550/27046]	Time 0.025 (0.022

Epoch: [2][7690/27046]	Time 0.028 (0.022)	Loss 0.3029 (0.1625)	
Epoch: [2][7700/27046]	Time 0.025 (0.022)	Loss 0.5185 (0.1626)	
Epoch: [2][7710/27046]	Time 0.026 (0.022)	Loss 0.0266 (0.1626)	
Epoch: [2][7720/27046]	Time 0.020 (0.022)	Loss 0.0247 (0.1625)	
Epoch: [2][7730/27046]	Time 0.028 (0.022)	Loss 0.0653 (0.1625)	
Epoch: [2][7740/27046]	Time 0.021 (0.022)	Loss 0.0402 (0.1627)	
Epoch: [2][7750/27046]	Time 0.024 (0.022)	Loss 0.2451 (0.1629)	
Epoch: [2][7760/27046]	Time 0.047 (0.022)	Loss 0.1182 (0.1628)	
Epoch: [2][7770/27046]	Time 0.029 (0.022)	Loss 0.0386 (0.1627)	
Epoch: [2][7780/27046]	Time 0.021 (0.022)	Loss 0.0315 (0.1628)	
Epoch: [2][7790/27046]	Time 0.032 (0.022)	Loss 0.1047 (0.1629)	
Epoch: [2][7800/27046]	Time 0.021 (0.022)	Loss 0.0194 (0.1629)	
Epoch: [2][7810/27046]	Time 0.029 (0.022)	Loss 0.0677 (0.1630)	
Epoch: [2][7820/27046]	Time 0.025 (0.022)	Loss 0.0294 (0.1630)	
Epoch: [2][7830/27046]	Time 0.023 (0.022)	Loss 0.0111 (0.1630)	
Epoch: [2][7840/27046]	Time 0.021 (0.022

Epoch: [2][8980/27046]	Time 0.024 (0.022)	Loss 0.1480 (0.1641)	
Epoch: [2][8990/27046]	Time 0.029 (0.022)	Loss 0.0313 (0.1640)	
Epoch: [2][9000/27046]	Time 0.023 (0.022)	Loss 0.1724 (0.1640)	
Epoch: [2][9010/27046]	Time 0.023 (0.022)	Loss 0.1188 (0.1640)	
Epoch: [2][9020/27046]	Time 0.032 (0.022)	Loss 0.0170 (0.1639)	
Epoch: [2][9030/27046]	Time 0.021 (0.022)	Loss 0.0490 (0.1639)	
Epoch: [2][9040/27046]	Time 0.049 (0.022)	Loss 0.0588 (0.1638)	
Epoch: [2][9050/27046]	Time 0.026 (0.022)	Loss 0.0890 (0.1637)	
Epoch: [2][9060/27046]	Time 0.027 (0.022)	Loss 0.2719 (0.1637)	
Epoch: [2][9070/27046]	Time 0.029 (0.022)	Loss 0.2293 (0.1638)	
Epoch: [2][9080/27046]	Time 0.028 (0.022)	Loss 0.1043 (0.1638)	
Epoch: [2][9090/27046]	Time 0.032 (0.022)	Loss 0.1428 (0.1638)	
Epoch: [2][9100/27046]	Time 0.020 (0.022)	Loss 0.0284 (0.1637)	
Epoch: [2][9110/27046]	Time 0.027 (0.022)	Loss 0.5021 (0.1638)	
Epoch: [2][9120/27046]	Time 0.022 (0.022)	Loss 0.5494 (0.1639)	
Epoch: [2][9130/27046]	Time 0.024 (0.022

Epoch: [2][10260/27046]	Time 0.019 (0.022)	Loss 0.0305 (0.1640)	
Epoch: [2][10270/27046]	Time 0.021 (0.022)	Loss 0.0329 (0.1639)	
Epoch: [2][10280/27046]	Time 0.019 (0.022)	Loss 0.0278 (0.1639)	
Epoch: [2][10290/27046]	Time 0.021 (0.022)	Loss 0.1386 (0.1639)	
Epoch: [2][10300/27046]	Time 0.020 (0.022)	Loss 0.0119 (0.1638)	
Epoch: [2][10310/27046]	Time 0.020 (0.022)	Loss 0.2454 (0.1638)	
Epoch: [2][10320/27046]	Time 0.049 (0.022)	Loss 0.1030 (0.1637)	
Epoch: [2][10330/27046]	Time 0.021 (0.022)	Loss 0.0790 (0.1636)	
Epoch: [2][10340/27046]	Time 0.020 (0.022)	Loss 0.0793 (0.1638)	
Epoch: [2][10350/27046]	Time 0.019 (0.022)	Loss 0.4610 (0.1638)	
Epoch: [2][10360/27046]	Time 0.020 (0.022)	Loss 0.0326 (0.1638)	
Epoch: [2][10370/27046]	Time 0.020 (0.022)	Loss 0.0862 (0.1638)	
Epoch: [2][10380/27046]	Time 0.019 (0.022)	Loss 0.0076 (0.1638)	
Epoch: [2][10390/27046]	Time 0.021 (0.022)	Loss 0.4279 (0.1637)	
Epoch: [2][10400/27046]	Time 0.022 (0.022)	Loss 0.1377 (0.1639)	
Epoch: [2][10410/27046]	T

Epoch: [2][11530/27046]	Time 0.020 (0.022)	Loss 0.0256 (0.1637)	
Epoch: [2][11540/27046]	Time 0.020 (0.022)	Loss 0.0916 (0.1637)	
Epoch: [2][11550/27046]	Time 0.019 (0.022)	Loss 0.0817 (0.1637)	
Epoch: [2][11560/27046]	Time 0.021 (0.022)	Loss 0.2558 (0.1638)	
Epoch: [2][11570/27046]	Time 0.024 (0.022)	Loss 0.0433 (0.1637)	
Epoch: [2][11580/27046]	Time 0.026 (0.022)	Loss 0.0557 (0.1639)	
Epoch: [2][11590/27046]	Time 0.024 (0.022)	Loss 0.1469 (0.1638)	
Epoch: [2][11600/27046]	Time 0.050 (0.022)	Loss 0.0206 (0.1638)	
Epoch: [2][11610/27046]	Time 0.026 (0.022)	Loss 0.1244 (0.1637)	
Epoch: [2][11620/27046]	Time 0.021 (0.022)	Loss 0.0704 (0.1638)	
Epoch: [2][11630/27046]	Time 0.022 (0.022)	Loss 0.0123 (0.1638)	
Epoch: [2][11640/27046]	Time 0.020 (0.022)	Loss 0.0524 (0.1637)	
Epoch: [2][11650/27046]	Time 0.019 (0.022)	Loss 0.3581 (0.1639)	
Epoch: [2][11660/27046]	Time 0.021 (0.022)	Loss 0.1102 (0.1638)	
Epoch: [2][11670/27046]	Time 0.021 (0.022)	Loss 0.0596 (0.1639)	
Epoch: [2][11680/27046]	T

Epoch: [2][12800/27046]	Time 0.020 (0.022)	Loss 0.1544 (0.1639)	
Epoch: [2][12810/27046]	Time 0.020 (0.022)	Loss 0.4774 (0.1639)	
Epoch: [2][12820/27046]	Time 0.019 (0.022)	Loss 0.1988 (0.1639)	
Epoch: [2][12830/27046]	Time 0.020 (0.022)	Loss 0.1320 (0.1639)	
Epoch: [2][12840/27046]	Time 0.019 (0.022)	Loss 0.2721 (0.1639)	
Epoch: [2][12850/27046]	Time 0.024 (0.022)	Loss 0.2211 (0.1640)	
Epoch: [2][12860/27046]	Time 0.020 (0.022)	Loss 0.1192 (0.1639)	
Epoch: [2][12870/27046]	Time 0.021 (0.022)	Loss 0.0182 (0.1638)	
Epoch: [2][12880/27046]	Time 0.050 (0.022)	Loss 0.0276 (0.1638)	
Epoch: [2][12890/27046]	Time 0.022 (0.022)	Loss 0.0164 (0.1638)	
Epoch: [2][12900/27046]	Time 0.019 (0.022)	Loss 0.1177 (0.1639)	
Epoch: [2][12910/27046]	Time 0.023 (0.022)	Loss 0.0151 (0.1639)	
Epoch: [2][12920/27046]	Time 0.019 (0.022)	Loss 0.0866 (0.1638)	
Epoch: [2][12930/27046]	Time 0.021 (0.022)	Loss 0.2636 (0.1640)	
Epoch: [2][12940/27046]	Time 0.021 (0.022)	Loss 0.0509 (0.1639)	
Epoch: [2][12950/27046]	T

Epoch: [2][14070/27046]	Time 0.019 (0.022)	Loss 0.0235 (0.1644)	
Epoch: [2][14080/27046]	Time 0.023 (0.022)	Loss 0.0760 (0.1644)	
Epoch: [2][14090/27046]	Time 0.020 (0.022)	Loss 0.2357 (0.1644)	
Epoch: [2][14100/27046]	Time 0.020 (0.022)	Loss 0.0145 (0.1643)	
Epoch: [2][14110/27046]	Time 0.021 (0.022)	Loss 0.1530 (0.1643)	
Epoch: [2][14120/27046]	Time 0.021 (0.022)	Loss 0.2448 (0.1642)	
Epoch: [2][14130/27046]	Time 0.023 (0.022)	Loss 0.0786 (0.1642)	
Epoch: [2][14140/27046]	Time 0.021 (0.022)	Loss 0.0101 (0.1642)	
Epoch: [2][14150/27046]	Time 0.020 (0.022)	Loss 0.0498 (0.1642)	
Epoch: [2][14160/27046]	Time 0.047 (0.022)	Loss 0.2465 (0.1642)	
Epoch: [2][14170/27046]	Time 0.020 (0.022)	Loss 0.0763 (0.1642)	
Epoch: [2][14180/27046]	Time 0.020 (0.022)	Loss 0.0177 (0.1642)	
Epoch: [2][14190/27046]	Time 0.023 (0.022)	Loss 0.0122 (0.1642)	
Epoch: [2][14200/27046]	Time 0.020 (0.022)	Loss 0.0013 (0.1642)	
Epoch: [2][14210/27046]	Time 0.020 (0.022)	Loss 0.1292 (0.1642)	
Epoch: [2][14220/27046]	T

Epoch: [2][15340/27046]	Time 0.019 (0.022)	Loss 0.2426 (0.1646)	
Epoch: [2][15350/27046]	Time 0.022 (0.022)	Loss 0.1076 (0.1646)	
Epoch: [2][15360/27046]	Time 0.022 (0.022)	Loss 0.0811 (0.1646)	
Epoch: [2][15370/27046]	Time 0.021 (0.022)	Loss 0.3903 (0.1646)	
Epoch: [2][15380/27046]	Time 0.020 (0.022)	Loss 0.1791 (0.1646)	
Epoch: [2][15390/27046]	Time 0.022 (0.022)	Loss 0.8713 (0.1646)	
Epoch: [2][15400/27046]	Time 0.021 (0.022)	Loss 0.4889 (0.1648)	
Epoch: [2][15410/27046]	Time 0.020 (0.022)	Loss 0.1259 (0.1652)	
Epoch: [2][15420/27046]	Time 0.019 (0.022)	Loss 0.1824 (0.1652)	
Epoch: [2][15430/27046]	Time 0.019 (0.022)	Loss 0.1213 (0.1652)	
Epoch: [2][15440/27046]	Time 0.051 (0.022)	Loss 0.2464 (0.1654)	
Epoch: [2][15450/27046]	Time 0.020 (0.022)	Loss 0.0313 (0.1656)	
Epoch: [2][15460/27046]	Time 0.020 (0.022)	Loss 0.9773 (0.1656)	
Epoch: [2][15470/27046]	Time 0.024 (0.022)	Loss 0.2765 (0.1659)	
Epoch: [2][15480/27046]	Time 0.020 (0.022)	Loss 0.0878 (0.1659)	
Epoch: [2][15490/27046]	T

Epoch: [2][16610/27046]	Time 0.023 (0.022)	Loss 0.0424 (0.1656)	
Epoch: [2][16620/27046]	Time 0.020 (0.022)	Loss 0.1024 (0.1656)	
Epoch: [2][16630/27046]	Time 0.019 (0.022)	Loss 0.0708 (0.1655)	
Epoch: [2][16640/27046]	Time 0.020 (0.022)	Loss 0.2148 (0.1655)	
Epoch: [2][16650/27046]	Time 0.020 (0.022)	Loss 0.1633 (0.1655)	
Epoch: [2][16660/27046]	Time 0.024 (0.022)	Loss 0.5364 (0.1655)	
Epoch: [2][16670/27046]	Time 0.020 (0.022)	Loss 0.2775 (0.1655)	
Epoch: [2][16680/27046]	Time 0.019 (0.022)	Loss 0.1608 (0.1654)	
Epoch: [2][16690/27046]	Time 0.020 (0.022)	Loss 0.0225 (0.1654)	
Epoch: [2][16700/27046]	Time 0.021 (0.022)	Loss 0.0358 (0.1654)	
Epoch: [2][16710/27046]	Time 0.019 (0.022)	Loss 0.0123 (0.1653)	
Epoch: [2][16720/27046]	Time 0.049 (0.022)	Loss 0.2109 (0.1654)	
Epoch: [2][16730/27046]	Time 0.021 (0.022)	Loss 0.1993 (0.1654)	
Epoch: [2][16740/27046]	Time 0.021 (0.022)	Loss 0.0609 (0.1654)	
Epoch: [2][16750/27046]	Time 0.021 (0.022)	Loss 0.1579 (0.1654)	
Epoch: [2][16760/27046]	T

Epoch: [2][17880/27046]	Time 0.020 (0.022)	Loss 0.3702 (0.1645)	
Epoch: [2][17890/27046]	Time 0.024 (0.022)	Loss 0.0537 (0.1644)	
Epoch: [2][17900/27046]	Time 0.020 (0.022)	Loss 0.3079 (0.1645)	
Epoch: [2][17910/27046]	Time 0.022 (0.022)	Loss 0.1752 (0.1645)	
Epoch: [2][17920/27046]	Time 0.024 (0.022)	Loss 0.0003 (0.1646)	
Epoch: [2][17930/27046]	Time 0.024 (0.022)	Loss 0.0730 (0.1645)	
Epoch: [2][17940/27046]	Time 0.021 (0.022)	Loss 0.2917 (0.1646)	
Epoch: [2][17950/27046]	Time 0.026 (0.022)	Loss 0.2666 (0.1646)	
Epoch: [2][17960/27046]	Time 0.021 (0.022)	Loss 0.1507 (0.1646)	
Epoch: [2][17970/27046]	Time 0.022 (0.022)	Loss 0.3509 (0.1646)	
Epoch: [2][17980/27046]	Time 0.023 (0.022)	Loss 0.0964 (0.1646)	
Epoch: [2][17990/27046]	Time 0.027 (0.022)	Loss 0.0151 (0.1647)	
Epoch: [2][18000/27046]	Time 0.055 (0.022)	Loss 0.1216 (0.1647)	
Epoch: [2][18010/27046]	Time 0.022 (0.022)	Loss 0.0373 (0.1646)	
Epoch: [2][18020/27046]	Time 0.021 (0.022)	Loss 0.0174 (0.1646)	
Epoch: [2][18030/27046]	T

Epoch: [2][19150/27046]	Time 0.021 (0.022)	Loss 0.0234 (0.1639)	
Epoch: [2][19160/27046]	Time 0.024 (0.022)	Loss 0.0465 (0.1639)	
Epoch: [2][19170/27046]	Time 0.023 (0.022)	Loss 0.0101 (0.1639)	
Epoch: [2][19180/27046]	Time 0.020 (0.022)	Loss 0.0239 (0.1639)	
Epoch: [2][19190/27046]	Time 0.022 (0.022)	Loss 0.1827 (0.1638)	
Epoch: [2][19200/27046]	Time 0.020 (0.022)	Loss 0.5400 (0.1638)	
Epoch: [2][19210/27046]	Time 0.019 (0.022)	Loss 0.0708 (0.1639)	
Epoch: [2][19220/27046]	Time 0.020 (0.022)	Loss 0.1529 (0.1640)	
Epoch: [2][19230/27046]	Time 0.027 (0.022)	Loss 0.1045 (0.1640)	
Epoch: [2][19240/27046]	Time 0.023 (0.022)	Loss 0.0211 (0.1640)	
Epoch: [2][19250/27046]	Time 0.021 (0.022)	Loss 0.0311 (0.1640)	
Epoch: [2][19260/27046]	Time 0.021 (0.022)	Loss 0.0617 (0.1639)	
Epoch: [2][19270/27046]	Time 0.025 (0.022)	Loss 0.1011 (0.1639)	
Epoch: [2][19280/27046]	Time 0.051 (0.022)	Loss 0.0076 (0.1640)	
Epoch: [2][19290/27046]	Time 0.024 (0.022)	Loss 0.0459 (0.1640)	
Epoch: [2][19300/27046]	T

Epoch: [2][20420/27046]	Time 0.023 (0.021)	Loss 0.3437 (0.1652)	
Epoch: [2][20430/27046]	Time 0.021 (0.021)	Loss 0.3419 (0.1652)	
Epoch: [2][20440/27046]	Time 0.020 (0.021)	Loss 0.6987 (0.1653)	
Epoch: [2][20450/27046]	Time 0.023 (0.021)	Loss 0.3923 (0.1654)	
Epoch: [2][20460/27046]	Time 0.019 (0.021)	Loss 0.0140 (0.1654)	
Epoch: [2][20470/27046]	Time 0.022 (0.021)	Loss 0.0102 (0.1654)	
Epoch: [2][20480/27046]	Time 0.019 (0.021)	Loss 0.3758 (0.1654)	
Epoch: [2][20490/27046]	Time 0.020 (0.021)	Loss 0.4375 (0.1654)	
Epoch: [2][20500/27046]	Time 0.020 (0.021)	Loss 0.0542 (0.1654)	
Epoch: [2][20510/27046]	Time 0.023 (0.021)	Loss 0.0966 (0.1654)	
Epoch: [2][20520/27046]	Time 0.021 (0.021)	Loss 0.0462 (0.1654)	
Epoch: [2][20530/27046]	Time 0.024 (0.021)	Loss 0.3188 (0.1654)	
Epoch: [2][20540/27046]	Time 0.024 (0.021)	Loss 0.0219 (0.1654)	
Epoch: [2][20550/27046]	Time 0.021 (0.021)	Loss 0.1736 (0.1655)	
Epoch: [2][20560/27046]	Time 0.050 (0.021)	Loss 0.1216 (0.1655)	
Epoch: [2][20570/27046]	T

Epoch: [2][21690/27046]	Time 0.019 (0.021)	Loss 0.0103 (0.1653)	
Epoch: [2][21700/27046]	Time 0.020 (0.021)	Loss 0.3502 (0.1653)	
Epoch: [2][21710/27046]	Time 0.021 (0.021)	Loss 0.0550 (0.1654)	
Epoch: [2][21720/27046]	Time 0.023 (0.021)	Loss 0.3380 (0.1654)	
Epoch: [2][21730/27046]	Time 0.029 (0.021)	Loss 0.3002 (0.1654)	
Epoch: [2][21740/27046]	Time 0.024 (0.021)	Loss 0.0891 (0.1654)	
Epoch: [2][21750/27046]	Time 0.024 (0.021)	Loss 0.2790 (0.1653)	
Epoch: [2][21760/27046]	Time 0.023 (0.021)	Loss 0.0563 (0.1653)	
Epoch: [2][21770/27046]	Time 0.021 (0.021)	Loss 0.4925 (0.1653)	
Epoch: [2][21780/27046]	Time 0.019 (0.021)	Loss 0.2855 (0.1653)	
Epoch: [2][21790/27046]	Time 0.026 (0.021)	Loss 1.2949 (0.1653)	
Epoch: [2][21800/27046]	Time 0.019 (0.021)	Loss 0.0004 (0.1653)	
Epoch: [2][21810/27046]	Time 0.020 (0.021)	Loss 0.1146 (0.1653)	
Epoch: [2][21820/27046]	Time 0.021 (0.021)	Loss 0.0585 (0.1653)	
Epoch: [2][21830/27046]	Time 0.021 (0.021)	Loss 0.2790 (0.1653)	
Epoch: [2][21840/27046]	T

Epoch: [2][22960/27046]	Time 0.024 (0.021)	Loss 1.7610 (0.1644)	
Epoch: [2][22970/27046]	Time 0.023 (0.021)	Loss 0.0558 (0.1644)	
Epoch: [2][22980/27046]	Time 0.019 (0.021)	Loss 0.1047 (0.1643)	
Epoch: [2][22990/27046]	Time 0.020 (0.021)	Loss 0.0372 (0.1643)	
Epoch: [2][23000/27046]	Time 0.020 (0.021)	Loss 0.3936 (0.1644)	
Epoch: [2][23010/27046]	Time 0.021 (0.021)	Loss 0.6632 (0.1644)	
Epoch: [2][23020/27046]	Time 0.020 (0.021)	Loss 0.0150 (0.1643)	
Epoch: [2][23030/27046]	Time 0.021 (0.021)	Loss 0.0410 (0.1643)	
Epoch: [2][23040/27046]	Time 0.020 (0.021)	Loss 0.1347 (0.1643)	
Epoch: [2][23050/27046]	Time 0.022 (0.021)	Loss 0.2636 (0.1642)	
Epoch: [2][23060/27046]	Time 0.020 (0.021)	Loss 0.0156 (0.1642)	
Epoch: [2][23070/27046]	Time 0.023 (0.021)	Loss 0.1077 (0.1642)	
Epoch: [2][23080/27046]	Time 0.019 (0.021)	Loss 0.0239 (0.1642)	
Epoch: [2][23090/27046]	Time 0.019 (0.021)	Loss 0.0252 (0.1642)	
Epoch: [2][23100/27046]	Time 0.019 (0.021)	Loss 0.1425 (0.1642)	
Epoch: [2][23110/27046]	T

Epoch: [2][24230/27046]	Time 0.021 (0.021)	Loss 0.0261 (0.1643)	
Epoch: [2][24240/27046]	Time 0.019 (0.021)	Loss 0.1246 (0.1643)	
Epoch: [2][24250/27046]	Time 0.020 (0.021)	Loss 0.0005 (0.1643)	
Epoch: [2][24260/27046]	Time 0.019 (0.021)	Loss 0.1650 (0.1643)	
Epoch: [2][24270/27046]	Time 0.021 (0.021)	Loss 0.0600 (0.1643)	
Epoch: [2][24280/27046]	Time 0.019 (0.021)	Loss 0.0295 (0.1643)	
Epoch: [2][24290/27046]	Time 0.024 (0.021)	Loss 0.1805 (0.1642)	
Epoch: [2][24300/27046]	Time 0.020 (0.021)	Loss 0.0070 (0.1643)	
Epoch: [2][24310/27046]	Time 0.021 (0.021)	Loss 0.0641 (0.1642)	
Epoch: [2][24320/27046]	Time 0.020 (0.021)	Loss 0.6886 (0.1642)	
Epoch: [2][24330/27046]	Time 0.019 (0.021)	Loss 0.0990 (0.1642)	
Epoch: [2][24340/27046]	Time 0.023 (0.021)	Loss 0.0715 (0.1642)	
Epoch: [2][24350/27046]	Time 0.024 (0.021)	Loss 0.0214 (0.1642)	
Epoch: [2][24360/27046]	Time 0.020 (0.021)	Loss 0.0026 (0.1642)	
Epoch: [2][24370/27046]	Time 0.020 (0.021)	Loss 0.2299 (0.1642)	
Epoch: [2][24380/27046]	T

Epoch: [2][25500/27046]	Time 0.020 (0.021)	Loss 0.0128 (0.1641)	
Epoch: [2][25510/27046]	Time 0.020 (0.021)	Loss 0.0044 (0.1641)	
Epoch: [2][25520/27046]	Time 0.021 (0.021)	Loss 0.0034 (0.1641)	
Epoch: [2][25530/27046]	Time 0.020 (0.021)	Loss 0.0140 (0.1641)	
Epoch: [2][25540/27046]	Time 0.020 (0.021)	Loss 0.0467 (0.1641)	
Epoch: [2][25550/27046]	Time 0.021 (0.021)	Loss 0.1276 (0.1641)	
Epoch: [2][25560/27046]	Time 0.020 (0.021)	Loss 0.0304 (0.1641)	
Epoch: [2][25570/27046]	Time 0.022 (0.021)	Loss 0.2185 (0.1641)	
Epoch: [2][25580/27046]	Time 0.020 (0.021)	Loss 0.2217 (0.1641)	
Epoch: [2][25590/27046]	Time 0.021 (0.021)	Loss 0.3221 (0.1642)	
Epoch: [2][25600/27046]	Time 0.020 (0.021)	Loss 0.2585 (0.1643)	
Epoch: [2][25610/27046]	Time 0.025 (0.021)	Loss 0.0047 (0.1643)	
Epoch: [2][25620/27046]	Time 0.019 (0.021)	Loss 0.5736 (0.1644)	
Epoch: [2][25630/27046]	Time 0.020 (0.021)	Loss 0.3395 (0.1643)	
Epoch: [2][25640/27046]	Time 0.021 (0.021)	Loss 0.0316 (0.1643)	
Epoch: [2][25650/27046]	T

Epoch: [2][26770/27046]	Time 0.021 (0.021)	Loss 0.0383 (0.1647)	
Epoch: [2][26780/27046]	Time 0.021 (0.021)	Loss 0.8580 (0.1647)	
Epoch: [2][26790/27046]	Time 0.020 (0.021)	Loss 0.0159 (0.1647)	
Epoch: [2][26800/27046]	Time 0.025 (0.021)	Loss 0.0506 (0.1647)	
Epoch: [2][26810/27046]	Time 0.022 (0.021)	Loss 0.0459 (0.1647)	
Epoch: [2][26820/27046]	Time 0.023 (0.021)	Loss 0.2990 (0.1647)	
Epoch: [2][26830/27046]	Time 0.025 (0.021)	Loss 0.1375 (0.1647)	
Epoch: [2][26840/27046]	Time 0.019 (0.021)	Loss 0.4519 (0.1647)	
Epoch: [2][26850/27046]	Time 0.025 (0.021)	Loss 0.0208 (0.1646)	
Epoch: [2][26860/27046]	Time 0.019 (0.021)	Loss 0.0901 (0.1646)	
Epoch: [2][26870/27046]	Time 0.021 (0.021)	Loss 0.0144 (0.1645)	
Epoch: [2][26880/27046]	Time 0.023 (0.021)	Loss 0.1096 (0.1646)	
Epoch: [2][26890/27046]	Time 0.020 (0.021)	Loss 0.0365 (0.1646)	
Epoch: [2][26900/27046]	Time 0.019 (0.021)	Loss 0.0555 (0.1646)	
Epoch: [2][26910/27046]	Time 0.024 (0.021)	Loss 0.0511 (0.1645)	
Epoch: [2][26920/27046]	T

Epoch: [2][1570/6762]	Time 0.004 (0.005)	
Epoch: [2][1580/6762]	Time 0.004 (0.005)	
Epoch: [2][1590/6762]	Time 0.004 (0.005)	
Epoch: [2][1600/6762]	Time 0.004 (0.005)	
Epoch: [2][1610/6762]	Time 0.003 (0.005)	
Epoch: [2][1620/6762]	Time 0.003 (0.005)	
Epoch: [2][1630/6762]	Time 0.003 (0.005)	
Epoch: [2][1640/6762]	Time 0.005 (0.005)	
Epoch: [2][1650/6762]	Time 0.003 (0.005)	
Epoch: [2][1660/6762]	Time 0.004 (0.005)	
Epoch: [2][1670/6762]	Time 0.004 (0.005)	
Epoch: [2][1680/6762]	Time 0.005 (0.005)	
Epoch: [2][1690/6762]	Time 0.004 (0.005)	
Epoch: [2][1700/6762]	Time 0.004 (0.005)	
Epoch: [2][1710/6762]	Time 0.005 (0.005)	
Epoch: [2][1720/6762]	Time 0.004 (0.005)	
Epoch: [2][1730/6762]	Time 0.004 (0.005)	
Epoch: [2][1740/6762]	Time 0.004 (0.005)	
Epoch: [2][1750/6762]	Time 0.005 (0.005)	
Epoch: [2][1760/6762]	Time 0.005 (0.005)	
Epoch: [2][1770/6762]	Time 0.005 (0.005)	
Epoch: [2][1780/6762]	Time 0.004 (0.005)	
Epoch: [2][1790/6762]	Time 0.004 (0.005)	
Epoch: [2][1800/6762]	Time 0.004 (

Epoch: [2][3560/6762]	Time 0.003 (0.005)	
Epoch: [2][3570/6762]	Time 0.004 (0.005)	
Epoch: [2][3580/6762]	Time 0.003 (0.005)	
Epoch: [2][3590/6762]	Time 0.004 (0.005)	
Epoch: [2][3600/6762]	Time 0.003 (0.005)	
Epoch: [2][3610/6762]	Time 0.004 (0.005)	
Epoch: [2][3620/6762]	Time 0.003 (0.005)	
Epoch: [2][3630/6762]	Time 0.003 (0.005)	
Epoch: [2][3640/6762]	Time 0.009 (0.005)	
Epoch: [2][3650/6762]	Time 0.004 (0.005)	
Epoch: [2][3660/6762]	Time 0.004 (0.005)	
Epoch: [2][3670/6762]	Time 0.004 (0.005)	
Epoch: [2][3680/6762]	Time 0.003 (0.005)	
Epoch: [2][3690/6762]	Time 0.005 (0.005)	
Epoch: [2][3700/6762]	Time 0.004 (0.005)	
Epoch: [2][3710/6762]	Time 0.004 (0.005)	
Epoch: [2][3720/6762]	Time 0.005 (0.005)	
Epoch: [2][3730/6762]	Time 0.004 (0.005)	
Epoch: [2][3740/6762]	Time 0.004 (0.005)	
Epoch: [2][3750/6762]	Time 0.004 (0.005)	
Epoch: [2][3760/6762]	Time 0.004 (0.005)	
Epoch: [2][3770/6762]	Time 0.003 (0.005)	
Epoch: [2][3780/6762]	Time 0.005 (0.005)	
Epoch: [2][3790/6762]	Time 0.004 (

Epoch: [2][5540/6762]	Time 0.005 (0.005)	
Epoch: [2][5550/6762]	Time 0.004 (0.005)	
Epoch: [2][5560/6762]	Time 0.005 (0.005)	
Epoch: [2][5570/6762]	Time 0.004 (0.005)	
Epoch: [2][5580/6762]	Time 0.004 (0.005)	
Epoch: [2][5590/6762]	Time 0.005 (0.005)	
Epoch: [2][5600/6762]	Time 0.004 (0.005)	
Epoch: [2][5610/6762]	Time 0.004 (0.005)	
Epoch: [2][5620/6762]	Time 0.004 (0.005)	
Epoch: [2][5630/6762]	Time 0.004 (0.005)	
Epoch: [2][5640/6762]	Time 0.004 (0.005)	
Epoch: [2][5650/6762]	Time 0.004 (0.005)	
Epoch: [2][5660/6762]	Time 0.004 (0.005)	
Epoch: [2][5670/6762]	Time 0.006 (0.005)	
Epoch: [2][5680/6762]	Time 0.004 (0.005)	
Epoch: [2][5690/6762]	Time 0.005 (0.005)	
Epoch: [2][5700/6762]	Time 0.004 (0.005)	
Epoch: [2][5710/6762]	Time 0.005 (0.005)	
Epoch: [2][5720/6762]	Time 0.004 (0.005)	
Epoch: [2][5730/6762]	Time 0.004 (0.005)	
Epoch: [2][5740/6762]	Time 0.004 (0.005)	
Epoch: [2][5750/6762]	Time 0.005 (0.005)	
Epoch: [2][5760/6762]	Time 0.003 (0.005)	
Epoch: [2][5770/6762]	Time 0.005 (

Epoch: [3][490/27046]	Time 0.020 (0.021)	Loss 0.1150 (0.1598)	
Epoch: [3][500/27046]	Time 0.020 (0.021)	Loss 0.0146 (0.1599)	
Epoch: [3][510/27046]	Time 0.020 (0.021)	Loss 0.2646 (0.1583)	
Epoch: [3][520/27046]	Time 0.020 (0.021)	Loss 0.0425 (0.1566)	
Epoch: [3][530/27046]	Time 0.019 (0.021)	Loss 0.5651 (0.1568)	
Epoch: [3][540/27046]	Time 0.019 (0.021)	Loss 0.1588 (0.1567)	
Epoch: [3][550/27046]	Time 0.020 (0.021)	Loss 0.0077 (0.1547)	
Epoch: [3][560/27046]	Time 0.019 (0.021)	Loss 0.0113 (0.1540)	
Epoch: [3][570/27046]	Time 0.023 (0.021)	Loss 0.1651 (0.1526)	
Epoch: [3][580/27046]	Time 0.020 (0.021)	Loss 0.1001 (0.1521)	
Epoch: [3][590/27046]	Time 0.019 (0.021)	Loss 0.6484 (0.1559)	
Epoch: [3][600/27046]	Time 0.020 (0.021)	Loss 0.0223 (0.1551)	
Epoch: [3][610/27046]	Time 0.019 (0.021)	Loss 0.8982 (0.1574)	
Epoch: [3][620/27046]	Time 0.019 (0.021)	Loss 0.1409 (0.1586)	
Epoch: [3][630/27046]	Time 0.023 (0.021)	Loss 0.0058 (0.1592)	
Epoch: [3][640/27046]	Time 0.066 (0.021)	Loss 0.0182 (0

Epoch: [3][1790/27046]	Time 0.025 (0.021)	Loss 0.0258 (0.1485)	
Epoch: [3][1800/27046]	Time 0.021 (0.021)	Loss 0.0745 (0.1486)	
Epoch: [3][1810/27046]	Time 0.027 (0.021)	Loss 0.0810 (0.1482)	
Epoch: [3][1820/27046]	Time 0.027 (0.021)	Loss 0.0775 (0.1480)	
Epoch: [3][1830/27046]	Time 0.024 (0.021)	Loss 0.0335 (0.1478)	
Epoch: [3][1840/27046]	Time 0.022 (0.021)	Loss 0.1218 (0.1475)	
Epoch: [3][1850/27046]	Time 0.026 (0.021)	Loss 0.1504 (0.1472)	
Epoch: [3][1860/27046]	Time 0.020 (0.021)	Loss 0.1113 (0.1468)	
Epoch: [3][1870/27046]	Time 0.023 (0.021)	Loss 0.0329 (0.1468)	
Epoch: [3][1880/27046]	Time 0.024 (0.021)	Loss 0.0564 (0.1468)	
Epoch: [3][1890/27046]	Time 0.022 (0.021)	Loss 0.0153 (0.1468)	
Epoch: [3][1900/27046]	Time 0.023 (0.021)	Loss 0.3478 (0.1464)	
Epoch: [3][1910/27046]	Time 0.027 (0.021)	Loss 0.3683 (0.1464)	
Epoch: [3][1920/27046]	Time 0.064 (0.021)	Loss 0.0781 (0.1465)	
Epoch: [3][1930/27046]	Time 0.023 (0.021)	Loss 0.0017 (0.1462)	
Epoch: [3][1940/27046]	Time 0.025 (0.021

Epoch: [3][3080/27046]	Time 0.024 (0.022)	Loss 0.1695 (0.1561)	
Epoch: [3][3090/27046]	Time 0.027 (0.022)	Loss 0.1448 (0.1563)	
Epoch: [3][3100/27046]	Time 0.025 (0.022)	Loss 0.0960 (0.1565)	
Epoch: [3][3110/27046]	Time 0.030 (0.022)	Loss 0.0621 (0.1564)	
Epoch: [3][3120/27046]	Time 0.024 (0.022)	Loss 0.1591 (0.1568)	
Epoch: [3][3130/27046]	Time 0.025 (0.022)	Loss 0.0619 (0.1569)	
Epoch: [3][3140/27046]	Time 0.021 (0.022)	Loss 0.0305 (0.1570)	
Epoch: [3][3150/27046]	Time 0.021 (0.022)	Loss 0.2854 (0.1571)	
Epoch: [3][3160/27046]	Time 0.027 (0.022)	Loss 0.1102 (0.1573)	
Epoch: [3][3170/27046]	Time 0.029 (0.022)	Loss 0.4715 (0.1574)	
Epoch: [3][3180/27046]	Time 0.024 (0.022)	Loss 0.2478 (0.1574)	
Epoch: [3][3190/27046]	Time 0.025 (0.022)	Loss 0.0331 (0.1571)	
Epoch: [3][3200/27046]	Time 0.063 (0.022)	Loss 0.0103 (0.1572)	
Epoch: [3][3210/27046]	Time 0.021 (0.022)	Loss 0.0128 (0.1570)	
Epoch: [3][3220/27046]	Time 0.019 (0.022)	Loss 0.0137 (0.1571)	
Epoch: [3][3230/27046]	Time 0.030 (0.022

Epoch: [3][4370/27046]	Time 0.020 (0.023)	Loss 0.0123 (0.1587)	
Epoch: [3][4380/27046]	Time 0.029 (0.023)	Loss 0.0392 (0.1586)	
Epoch: [3][4390/27046]	Time 0.023 (0.023)	Loss 0.1111 (0.1586)	
Epoch: [3][4400/27046]	Time 0.026 (0.023)	Loss 0.0061 (0.1588)	
Epoch: [3][4410/27046]	Time 0.023 (0.023)	Loss 0.8233 (0.1589)	
Epoch: [3][4420/27046]	Time 0.024 (0.023)	Loss 0.0627 (0.1588)	
Epoch: [3][4430/27046]	Time 0.023 (0.023)	Loss 0.0138 (0.1586)	
Epoch: [3][4440/27046]	Time 0.029 (0.023)	Loss 0.0289 (0.1588)	
Epoch: [3][4450/27046]	Time 0.029 (0.023)	Loss 0.0075 (0.1588)	
Epoch: [3][4460/27046]	Time 0.028 (0.023)	Loss 0.0577 (0.1588)	
Epoch: [3][4470/27046]	Time 0.023 (0.023)	Loss 0.9320 (0.1592)	
Epoch: [3][4480/27046]	Time 0.064 (0.023)	Loss 0.1263 (0.1592)	
Epoch: [3][4490/27046]	Time 0.021 (0.023)	Loss 0.1941 (0.1592)	
Epoch: [3][4500/27046]	Time 0.023 (0.023)	Loss 0.3008 (0.1594)	
Epoch: [3][4510/27046]	Time 0.023 (0.023)	Loss 0.0082 (0.1594)	
Epoch: [3][4520/27046]	Time 0.023 (0.023

Epoch: [3][5660/27046]	Time 0.022 (0.023)	Loss 0.1531 (0.1604)	
Epoch: [3][5670/27046]	Time 0.023 (0.023)	Loss 0.1917 (0.1604)	
Epoch: [3][5680/27046]	Time 0.024 (0.023)	Loss 0.1164 (0.1606)	
Epoch: [3][5690/27046]	Time 0.035 (0.023)	Loss 0.1404 (0.1606)	
Epoch: [3][5700/27046]	Time 0.029 (0.023)	Loss 0.0728 (0.1606)	
Epoch: [3][5710/27046]	Time 0.028 (0.023)	Loss 0.2742 (0.1606)	
Epoch: [3][5720/27046]	Time 0.024 (0.023)	Loss 0.0570 (0.1605)	
Epoch: [3][5730/27046]	Time 0.025 (0.023)	Loss 0.0350 (0.1606)	
Epoch: [3][5740/27046]	Time 0.027 (0.023)	Loss 0.2322 (0.1605)	
Epoch: [3][5750/27046]	Time 0.031 (0.023)	Loss 0.0070 (0.1607)	
Epoch: [3][5760/27046]	Time 0.069 (0.023)	Loss 0.0534 (0.1608)	
Epoch: [3][5770/27046]	Time 0.026 (0.023)	Loss 0.0490 (0.1608)	
Epoch: [3][5780/27046]	Time 0.028 (0.023)	Loss 0.1018 (0.1609)	
Epoch: [3][5790/27046]	Time 0.023 (0.023)	Loss 0.2221 (0.1610)	
Epoch: [3][5800/27046]	Time 0.028 (0.023)	Loss 0.0127 (0.1611)	
Epoch: [3][5810/27046]	Time 0.027 (0.023

Epoch: [3][6950/27046]	Time 0.024 (0.023)	Loss 0.0639 (0.1622)	
Epoch: [3][6960/27046]	Time 0.025 (0.023)	Loss 0.0038 (0.1620)	
Epoch: [3][6970/27046]	Time 0.020 (0.023)	Loss 0.1527 (0.1620)	
Epoch: [3][6980/27046]	Time 0.030 (0.023)	Loss 0.0683 (0.1620)	
Epoch: [3][6990/27046]	Time 0.024 (0.023)	Loss 0.0809 (0.1620)	
Epoch: [3][7000/27046]	Time 0.027 (0.023)	Loss 0.0654 (0.1619)	
Epoch: [3][7010/27046]	Time 0.023 (0.023)	Loss 0.4001 (0.1620)	
Epoch: [3][7020/27046]	Time 0.025 (0.023)	Loss 0.1362 (0.1619)	
Epoch: [3][7030/27046]	Time 0.027 (0.023)	Loss 0.0041 (0.1620)	
Epoch: [3][7040/27046]	Time 0.077 (0.023)	Loss 0.0700 (0.1620)	
Epoch: [3][7050/27046]	Time 0.022 (0.023)	Loss 0.1145 (0.1619)	
Epoch: [3][7060/27046]	Time 0.028 (0.023)	Loss 0.2068 (0.1619)	
Epoch: [3][7070/27046]	Time 0.021 (0.023)	Loss 0.0657 (0.1618)	
Epoch: [3][7080/27046]	Time 0.022 (0.023)	Loss 0.0065 (0.1617)	
Epoch: [3][7090/27046]	Time 0.025 (0.023)	Loss 0.4879 (0.1618)	
Epoch: [3][7100/27046]	Time 0.038 (0.023

Epoch: [3][8240/27046]	Time 0.023 (0.023)	Loss 0.5216 (0.1632)	
Epoch: [3][8250/27046]	Time 0.031 (0.023)	Loss 0.2370 (0.1630)	
Epoch: [3][8260/27046]	Time 0.024 (0.023)	Loss 0.0258 (0.1632)	
Epoch: [3][8270/27046]	Time 0.026 (0.023)	Loss 0.0577 (0.1631)	
Epoch: [3][8280/27046]	Time 0.024 (0.023)	Loss 0.0255 (0.1630)	
Epoch: [3][8290/27046]	Time 0.024 (0.023)	Loss 0.0794 (0.1631)	
Epoch: [3][8300/27046]	Time 0.029 (0.023)	Loss 0.0022 (0.1630)	
Epoch: [3][8310/27046]	Time 0.031 (0.023)	Loss 0.0178 (0.1629)	
Epoch: [3][8320/27046]	Time 0.083 (0.023)	Loss 0.0649 (0.1629)	
Epoch: [3][8330/27046]	Time 0.020 (0.023)	Loss 0.0397 (0.1629)	
Epoch: [3][8340/27046]	Time 0.033 (0.023)	Loss 0.0967 (0.1630)	
Epoch: [3][8350/27046]	Time 0.025 (0.023)	Loss 0.4401 (0.1631)	
Epoch: [3][8360/27046]	Time 0.025 (0.023)	Loss 0.0444 (0.1630)	
Epoch: [3][8370/27046]	Time 0.025 (0.023)	Loss 0.2186 (0.1629)	
Epoch: [3][8380/27046]	Time 0.028 (0.023)	Loss 0.0097 (0.1629)	
Epoch: [3][8390/27046]	Time 0.025 (0.023

Epoch: [3][9540/27046]	Time 0.021 (0.023)	Loss 0.1195 (0.1631)	
Epoch: [3][9550/27046]	Time 0.019 (0.023)	Loss 0.5796 (0.1632)	
Epoch: [3][9560/27046]	Time 0.020 (0.023)	Loss 0.0380 (0.1631)	
Epoch: [3][9570/27046]	Time 0.021 (0.023)	Loss 0.0369 (0.1631)	
Epoch: [3][9580/27046]	Time 0.020 (0.023)	Loss 0.9593 (0.1631)	
Epoch: [3][9590/27046]	Time 0.025 (0.023)	Loss 0.0908 (0.1632)	
Epoch: [3][9600/27046]	Time 0.082 (0.023)	Loss 0.2886 (0.1631)	
Epoch: [3][9610/27046]	Time 0.019 (0.023)	Loss 0.4835 (0.1631)	
Epoch: [3][9620/27046]	Time 0.019 (0.023)	Loss 0.0494 (0.1631)	
Epoch: [3][9630/27046]	Time 0.021 (0.023)	Loss 0.0250 (0.1631)	
Epoch: [3][9640/27046]	Time 0.020 (0.023)	Loss 0.0378 (0.1630)	
Epoch: [3][9650/27046]	Time 0.024 (0.023)	Loss 0.4187 (0.1631)	
Epoch: [3][9660/27046]	Time 0.020 (0.023)	Loss 0.2561 (0.1631)	
Epoch: [3][9670/27046]	Time 0.019 (0.023)	Loss 0.4161 (0.1631)	
Epoch: [3][9680/27046]	Time 0.020 (0.023)	Loss 0.2475 (0.1632)	
Epoch: [3][9690/27046]	Time 0.020 (0.023

Epoch: [3][10820/27046]	Time 0.021 (0.023)	Loss 0.1681 (0.1627)	
Epoch: [3][10830/27046]	Time 0.020 (0.023)	Loss 0.0325 (0.1627)	
Epoch: [3][10840/27046]	Time 0.021 (0.023)	Loss 0.0359 (0.1626)	
Epoch: [3][10850/27046]	Time 0.025 (0.023)	Loss 1.2887 (0.1628)	
Epoch: [3][10860/27046]	Time 0.022 (0.023)	Loss 0.5597 (0.1628)	
Epoch: [3][10870/27046]	Time 0.019 (0.023)	Loss 0.2589 (0.1630)	
Epoch: [3][10880/27046]	Time 0.084 (0.023)	Loss 0.1717 (0.1630)	
Epoch: [3][10890/27046]	Time 0.029 (0.023)	Loss 0.3857 (0.1630)	
Epoch: [3][10900/27046]	Time 0.025 (0.023)	Loss 0.0017 (0.1630)	
Epoch: [3][10910/27046]	Time 0.020 (0.023)	Loss 0.0355 (0.1632)	
Epoch: [3][10920/27046]	Time 0.023 (0.023)	Loss 0.1384 (0.1631)	
Epoch: [3][10930/27046]	Time 0.028 (0.023)	Loss 0.0053 (0.1631)	
Epoch: [3][10940/27046]	Time 0.028 (0.023)	Loss 0.0906 (0.1631)	
Epoch: [3][10950/27046]	Time 0.022 (0.023)	Loss 0.5971 (0.1631)	
Epoch: [3][10960/27046]	Time 0.021 (0.023)	Loss 0.2575 (0.1631)	
Epoch: [3][10970/27046]	T

Epoch: [3][12090/27046]	Time 0.021 (0.023)	Loss 0.1079 (0.1636)	
Epoch: [3][12100/27046]	Time 0.020 (0.023)	Loss 0.0139 (0.1636)	
Epoch: [3][12110/27046]	Time 0.025 (0.023)	Loss 0.0008 (0.1635)	
Epoch: [3][12120/27046]	Time 0.025 (0.023)	Loss 0.0159 (0.1635)	
Epoch: [3][12130/27046]	Time 0.026 (0.023)	Loss 0.0446 (0.1634)	
Epoch: [3][12140/27046]	Time 0.025 (0.023)	Loss 0.1847 (0.1635)	
Epoch: [3][12150/27046]	Time 0.022 (0.023)	Loss 0.2277 (0.1634)	
Epoch: [3][12160/27046]	Time 0.083 (0.023)	Loss 0.7887 (0.1635)	
Epoch: [3][12170/27046]	Time 0.029 (0.023)	Loss 0.0520 (0.1635)	
Epoch: [3][12180/27046]	Time 0.027 (0.023)	Loss 0.1000 (0.1634)	
Epoch: [3][12190/27046]	Time 0.026 (0.023)	Loss 0.1389 (0.1636)	
Epoch: [3][12200/27046]	Time 0.026 (0.023)	Loss 0.0103 (0.1636)	
Epoch: [3][12210/27046]	Time 0.025 (0.023)	Loss 0.0158 (0.1635)	
Epoch: [3][12220/27046]	Time 0.019 (0.023)	Loss 0.0455 (0.1635)	
Epoch: [3][12230/27046]	Time 0.021 (0.023)	Loss 0.0095 (0.1637)	
Epoch: [3][12240/27046]	T

Epoch: [3][13370/27046]	Time 0.022 (0.023)	Loss 0.0456 (0.1655)	
Epoch: [3][13380/27046]	Time 0.019 (0.023)	Loss 0.0809 (0.1655)	
Epoch: [3][13390/27046]	Time 0.022 (0.023)	Loss 0.0870 (0.1655)	
Epoch: [3][13400/27046]	Time 0.021 (0.023)	Loss 0.2357 (0.1656)	
Epoch: [3][13410/27046]	Time 0.021 (0.023)	Loss 0.2766 (0.1655)	
Epoch: [3][13420/27046]	Time 0.028 (0.023)	Loss 0.0689 (0.1655)	
Epoch: [3][13430/27046]	Time 0.021 (0.023)	Loss 0.2428 (0.1655)	
Epoch: [3][13440/27046]	Time 0.086 (0.023)	Loss 0.1829 (0.1655)	
Epoch: [3][13450/27046]	Time 0.023 (0.023)	Loss 0.0187 (0.1655)	
Epoch: [3][13460/27046]	Time 0.021 (0.023)	Loss 0.1473 (0.1655)	
Epoch: [3][13470/27046]	Time 0.025 (0.023)	Loss 0.2060 (0.1655)	
Epoch: [3][13480/27046]	Time 0.027 (0.023)	Loss 0.0950 (0.1654)	
Epoch: [3][13490/27046]	Time 0.026 (0.023)	Loss 0.3235 (0.1654)	
Epoch: [3][13500/27046]	Time 0.027 (0.023)	Loss 0.0242 (0.1654)	
Epoch: [3][13510/27046]	Time 0.023 (0.023)	Loss 0.0057 (0.1654)	
Epoch: [3][13520/27046]	T

Epoch: [3][14640/27046]	Time 0.020 (0.023)	Loss 0.2645 (0.1656)	
Epoch: [3][14650/27046]	Time 0.026 (0.023)	Loss 0.1773 (0.1656)	
Epoch: [3][14660/27046]	Time 0.020 (0.023)	Loss 0.4488 (0.1657)	
Epoch: [3][14670/27046]	Time 0.025 (0.023)	Loss 0.0031 (0.1656)	
Epoch: [3][14680/27046]	Time 0.025 (0.023)	Loss 0.0588 (0.1656)	
Epoch: [3][14690/27046]	Time 0.026 (0.023)	Loss 0.2729 (0.1656)	
Epoch: [3][14700/27046]	Time 0.025 (0.023)	Loss 0.2916 (0.1655)	
Epoch: [3][14710/27046]	Time 0.028 (0.023)	Loss 0.0756 (0.1656)	
Epoch: [3][14720/27046]	Time 0.083 (0.023)	Loss 0.5610 (0.1656)	
Epoch: [3][14730/27046]	Time 0.027 (0.023)	Loss 0.2677 (0.1655)	
Epoch: [3][14740/27046]	Time 0.025 (0.023)	Loss 0.0388 (0.1654)	
Epoch: [3][14750/27046]	Time 0.029 (0.023)	Loss 0.0094 (0.1654)	
Epoch: [3][14760/27046]	Time 0.028 (0.023)	Loss 0.5013 (0.1655)	
Epoch: [3][14770/27046]	Time 0.025 (0.023)	Loss 0.0872 (0.1655)	
Epoch: [3][14780/27046]	Time 0.024 (0.023)	Loss 0.0056 (0.1656)	
Epoch: [3][14790/27046]	T

Epoch: [3][15920/27046]	Time 0.019 (0.023)	Loss 0.0231 (0.1655)	
Epoch: [3][15930/27046]	Time 0.021 (0.023)	Loss 0.0419 (0.1654)	
Epoch: [3][15940/27046]	Time 0.021 (0.023)	Loss 0.4760 (0.1654)	
Epoch: [3][15950/27046]	Time 0.023 (0.023)	Loss 0.0052 (0.1654)	
Epoch: [3][15960/27046]	Time 0.023 (0.023)	Loss 0.0086 (0.1653)	
Epoch: [3][15970/27046]	Time 0.025 (0.023)	Loss 0.0891 (0.1653)	
Epoch: [3][15980/27046]	Time 0.019 (0.023)	Loss 0.0157 (0.1652)	
Epoch: [3][15990/27046]	Time 0.026 (0.023)	Loss 0.0269 (0.1652)	
Epoch: [3][16000/27046]	Time 0.087 (0.023)	Loss 0.0140 (0.1652)	
Epoch: [3][16010/27046]	Time 0.020 (0.023)	Loss 0.2891 (0.1652)	
Epoch: [3][16020/27046]	Time 0.021 (0.023)	Loss 0.0077 (0.1652)	
Epoch: [3][16030/27046]	Time 0.024 (0.023)	Loss 0.0333 (0.1651)	
Epoch: [3][16040/27046]	Time 0.019 (0.023)	Loss 0.2571 (0.1651)	
Epoch: [3][16050/27046]	Time 0.020 (0.023)	Loss 0.0110 (0.1650)	
Epoch: [3][16060/27046]	Time 0.021 (0.023)	Loss 0.0120 (0.1650)	
Epoch: [3][16070/27046]	T

Epoch: [3][17200/27046]	Time 0.021 (0.023)	Loss 0.0801 (0.1653)	
Epoch: [3][17210/27046]	Time 0.025 (0.023)	Loss 0.9795 (0.1655)	
Epoch: [3][17220/27046]	Time 0.020 (0.023)	Loss 0.4584 (0.1655)	
Epoch: [3][17230/27046]	Time 0.026 (0.023)	Loss 0.1925 (0.1655)	
Epoch: [3][17240/27046]	Time 0.024 (0.023)	Loss 0.3334 (0.1655)	
Epoch: [3][17250/27046]	Time 0.021 (0.023)	Loss 0.0231 (0.1656)	
Epoch: [3][17260/27046]	Time 0.022 (0.023)	Loss 0.5712 (0.1657)	
Epoch: [3][17270/27046]	Time 0.020 (0.023)	Loss 0.1630 (0.1658)	
Epoch: [3][17280/27046]	Time 0.082 (0.023)	Loss 0.3606 (0.1658)	
Epoch: [3][17290/27046]	Time 0.027 (0.023)	Loss 0.0009 (0.1658)	
Epoch: [3][17300/27046]	Time 0.027 (0.023)	Loss 0.2677 (0.1658)	
Epoch: [3][17310/27046]	Time 0.019 (0.023)	Loss 0.0584 (0.1658)	
Epoch: [3][17320/27046]	Time 0.019 (0.023)	Loss 0.3974 (0.1658)	
Epoch: [3][17330/27046]	Time 0.026 (0.023)	Loss 1.7459 (0.1660)	
Epoch: [3][17340/27046]	Time 0.026 (0.023)	Loss 0.0894 (0.1660)	
Epoch: [3][17350/27046]	T

Epoch: [3][18470/27046]	Time 0.021 (0.023)	Loss 0.0947 (0.1662)	
Epoch: [3][18480/27046]	Time 0.021 (0.023)	Loss 0.0198 (0.1662)	
Epoch: [3][18490/27046]	Time 0.024 (0.023)	Loss 0.0885 (0.1662)	
Epoch: [3][18500/27046]	Time 0.019 (0.023)	Loss 0.0894 (0.1662)	
Epoch: [3][18510/27046]	Time 0.021 (0.023)	Loss 0.1325 (0.1663)	
Epoch: [3][18520/27046]	Time 0.019 (0.023)	Loss 0.0147 (0.1663)	
Epoch: [3][18530/27046]	Time 0.026 (0.023)	Loss 0.0011 (0.1663)	
Epoch: [3][18540/27046]	Time 0.025 (0.023)	Loss 0.2241 (0.1663)	
Epoch: [3][18550/27046]	Time 0.020 (0.023)	Loss 0.0087 (0.1663)	
Epoch: [3][18560/27046]	Time 0.087 (0.023)	Loss 0.1666 (0.1662)	
Epoch: [3][18570/27046]	Time 0.021 (0.023)	Loss 0.0347 (0.1662)	
Epoch: [3][18580/27046]	Time 0.019 (0.023)	Loss 0.1584 (0.1662)	
Epoch: [3][18590/27046]	Time 0.026 (0.023)	Loss 0.1876 (0.1662)	
Epoch: [3][18600/27046]	Time 0.022 (0.023)	Loss 0.4377 (0.1662)	
Epoch: [3][18610/27046]	Time 0.027 (0.023)	Loss 0.0007 (0.1661)	
Epoch: [3][18620/27046]	T

Epoch: [3][19750/27046]	Time 0.023 (0.023)	Loss 0.4201 (0.1664)	
Epoch: [3][19760/27046]	Time 0.021 (0.023)	Loss 0.4602 (0.1665)	
Epoch: [3][19770/27046]	Time 0.026 (0.023)	Loss 0.3293 (0.1664)	
Epoch: [3][19780/27046]	Time 0.021 (0.023)	Loss 0.0383 (0.1664)	
Epoch: [3][19790/27046]	Time 0.019 (0.023)	Loss 0.3079 (0.1664)	
Epoch: [3][19800/27046]	Time 0.023 (0.023)	Loss 0.2645 (0.1663)	
Epoch: [3][19810/27046]	Time 0.029 (0.023)	Loss 0.2273 (0.1664)	
Epoch: [3][19820/27046]	Time 0.025 (0.023)	Loss 0.0218 (0.1663)	
Epoch: [3][19830/27046]	Time 0.028 (0.023)	Loss 1.0097 (0.1664)	
Epoch: [3][19840/27046]	Time 0.116 (0.023)	Loss 0.0606 (0.1664)	
Epoch: [3][19850/27046]	Time 0.021 (0.023)	Loss 0.0425 (0.1663)	
Epoch: [3][19860/27046]	Time 0.031 (0.023)	Loss 0.1162 (0.1664)	
Epoch: [3][19870/27046]	Time 0.031 (0.023)	Loss 0.0141 (0.1664)	
Epoch: [3][19880/27046]	Time 0.021 (0.023)	Loss 0.0957 (0.1664)	
Epoch: [3][19890/27046]	Time 0.028 (0.023)	Loss 0.0035 (0.1664)	
Epoch: [3][19900/27046]	T

Epoch: [3][21020/27046]	Time 0.024 (0.023)	Loss 0.1423 (0.1655)	
Epoch: [3][21030/27046]	Time 0.021 (0.023)	Loss 0.0985 (0.1654)	
Epoch: [3][21040/27046]	Time 0.020 (0.023)	Loss 0.0438 (0.1654)	
Epoch: [3][21050/27046]	Time 0.030 (0.023)	Loss 0.3368 (0.1656)	
Epoch: [3][21060/27046]	Time 0.019 (0.023)	Loss 0.1155 (0.1656)	
Epoch: [3][21070/27046]	Time 0.020 (0.023)	Loss 0.2636 (0.1657)	
Epoch: [3][21080/27046]	Time 0.021 (0.023)	Loss 0.2535 (0.1657)	
Epoch: [3][21090/27046]	Time 0.033 (0.023)	Loss 0.0136 (0.1658)	
Epoch: [3][21100/27046]	Time 0.021 (0.023)	Loss 0.1629 (0.1658)	
Epoch: [3][21110/27046]	Time 0.027 (0.023)	Loss 0.0152 (0.1657)	
Epoch: [3][21120/27046]	Time 0.088 (0.023)	Loss 0.0615 (0.1657)	
Epoch: [3][21130/27046]	Time 0.024 (0.023)	Loss 0.2404 (0.1657)	
Epoch: [3][21140/27046]	Time 0.022 (0.023)	Loss 0.1422 (0.1657)	
Epoch: [3][21150/27046]	Time 0.021 (0.023)	Loss 0.0796 (0.1657)	
Epoch: [3][21160/27046]	Time 0.021 (0.023)	Loss 0.1860 (0.1657)	
Epoch: [3][21170/27046]	T

Epoch: [3][22300/27046]	Time 0.021 (0.023)	Loss 0.1716 (0.1647)	
Epoch: [3][22310/27046]	Time 0.022 (0.023)	Loss 0.0227 (0.1646)	
Epoch: [3][22320/27046]	Time 0.020 (0.023)	Loss 0.4153 (0.1646)	
Epoch: [3][22330/27046]	Time 0.024 (0.023)	Loss 0.0305 (0.1646)	
Epoch: [3][22340/27046]	Time 0.021 (0.023)	Loss 0.1346 (0.1646)	
Epoch: [3][22350/27046]	Time 0.020 (0.023)	Loss 0.1935 (0.1647)	
Epoch: [3][22360/27046]	Time 0.019 (0.023)	Loss 0.0334 (0.1647)	
Epoch: [3][22370/27046]	Time 0.027 (0.023)	Loss 0.0987 (0.1647)	
Epoch: [3][22380/27046]	Time 0.025 (0.023)	Loss 0.0915 (0.1647)	
Epoch: [3][22390/27046]	Time 0.025 (0.023)	Loss 0.0198 (0.1648)	
Epoch: [3][22400/27046]	Time 0.087 (0.023)	Loss 0.0099 (0.1648)	
Epoch: [3][22410/27046]	Time 0.028 (0.023)	Loss 0.0303 (0.1648)	
Epoch: [3][22420/27046]	Time 0.023 (0.023)	Loss 0.4197 (0.1648)	
Epoch: [3][22430/27046]	Time 0.027 (0.023)	Loss 0.4535 (0.1648)	
Epoch: [3][22440/27046]	Time 0.025 (0.023)	Loss 0.1198 (0.1648)	
Epoch: [3][22450/27046]	T

Epoch: [3][23580/27046]	Time 0.021 (0.023)	Loss 0.0180 (0.1649)	
Epoch: [3][23590/27046]	Time 0.027 (0.023)	Loss 0.5922 (0.1649)	
Epoch: [3][23600/27046]	Time 0.026 (0.023)	Loss 1.0033 (0.1649)	
Epoch: [3][23610/27046]	Time 0.026 (0.023)	Loss 0.1317 (0.1649)	
Epoch: [3][23620/27046]	Time 0.020 (0.023)	Loss 0.0422 (0.1649)	
Epoch: [3][23630/27046]	Time 0.028 (0.023)	Loss 0.0111 (0.1649)	
Epoch: [3][23640/27046]	Time 0.025 (0.023)	Loss 0.3489 (0.1649)	
Epoch: [3][23650/27046]	Time 0.029 (0.023)	Loss 0.0922 (0.1649)	
Epoch: [3][23660/27046]	Time 0.025 (0.023)	Loss 0.0303 (0.1649)	
Epoch: [3][23670/27046]	Time 0.029 (0.023)	Loss 0.0118 (0.1649)	
Epoch: [3][23680/27046]	Time 0.093 (0.023)	Loss 0.0551 (0.1649)	
Epoch: [3][23690/27046]	Time 0.021 (0.023)	Loss 0.1436 (0.1648)	
Epoch: [3][23700/27046]	Time 0.020 (0.023)	Loss 0.0177 (0.1648)	
Epoch: [3][23710/27046]	Time 0.022 (0.023)	Loss 0.0091 (0.1648)	
Epoch: [3][23720/27046]	Time 0.026 (0.023)	Loss 0.1591 (0.1648)	
Epoch: [3][23730/27046]	T

Epoch: [3][24860/27046]	Time 0.019 (0.023)	Loss 0.0006 (0.1642)	
Epoch: [3][24870/27046]	Time 0.025 (0.023)	Loss 0.2418 (0.1642)	
Epoch: [3][24880/27046]	Time 0.021 (0.023)	Loss 0.0168 (0.1642)	
Epoch: [3][24890/27046]	Time 0.020 (0.023)	Loss 0.0863 (0.1642)	
Epoch: [3][24900/27046]	Time 0.022 (0.023)	Loss 0.0693 (0.1642)	
Epoch: [3][24910/27046]	Time 0.026 (0.023)	Loss 0.3234 (0.1642)	
Epoch: [3][24920/27046]	Time 0.020 (0.023)	Loss 0.0865 (0.1641)	
Epoch: [3][24930/27046]	Time 0.021 (0.023)	Loss 0.0329 (0.1641)	
Epoch: [3][24940/27046]	Time 0.025 (0.023)	Loss 0.0968 (0.1641)	
Epoch: [3][24950/27046]	Time 0.021 (0.023)	Loss 0.1273 (0.1642)	
Epoch: [3][24960/27046]	Time 0.082 (0.023)	Loss 0.1849 (0.1642)	
Epoch: [3][24970/27046]	Time 0.027 (0.023)	Loss 0.0252 (0.1642)	
Epoch: [3][24980/27046]	Time 0.026 (0.023)	Loss 0.0058 (0.1641)	
Epoch: [3][24990/27046]	Time 0.020 (0.023)	Loss 0.1141 (0.1641)	
Epoch: [3][25000/27046]	Time 0.020 (0.023)	Loss 0.0403 (0.1641)	
Epoch: [3][25010/27046]	T

Epoch: [3][26130/27046]	Time 0.028 (0.023)	Loss 0.3030 (0.1643)	
Epoch: [3][26140/27046]	Time 0.019 (0.023)	Loss 0.1315 (0.1643)	
Epoch: [3][26150/27046]	Time 0.020 (0.023)	Loss 0.2219 (0.1643)	
Epoch: [3][26160/27046]	Time 0.027 (0.023)	Loss 0.2241 (0.1643)	
Epoch: [3][26170/27046]	Time 0.020 (0.023)	Loss 0.0043 (0.1643)	
Epoch: [3][26180/27046]	Time 0.020 (0.023)	Loss 0.1741 (0.1643)	
Epoch: [3][26190/27046]	Time 0.030 (0.023)	Loss 0.0529 (0.1643)	


KeyboardInterrupt: 

In [22]:
# %%experiment 
# {
#     'name': 'Vanilla ViT model Optimization test',
#     'metrics': [
#         {
#             'name': 'MSE',
#             'strategy': 'optimize',
#             'objective': 'minimize',
#         }
#     ],
#     'parameters': [
#         {
#             'name': 'reg',
#             'type': 'double',
#             'bounds': {'min': 0.0001, 'max': 0.5},
#             'transformation': 'log'
#         },
#         {
#             'name': 'learning_rate',
#             'type': 'double',
#             'bounds': {'min': 0.0001, 'max': 0.9},
#             'transformation': 'log'
#         },
#         {
#             'name': 'batch_size',
#             'type': 'categorical',
#             'categorical_values': ['32', '64']
#         }
#     ],
#     'budget': 30
# }

UsageError: Cell magic `%%experiment` not found.


In [23]:
# %%optimize vanilla_vit_optimization_run_test
# evaluate(args)

UsageError: Cell magic `%%optimize` not found.
