# Inicialização

In [1]:
import torch
from torch import nn
from torch.utils.data import Dataset, DataLoader
import torchvision
from torchvision import datasets
from torchvision.transforms import ToTensor
import torch.optim as optim
from torcheval.metrics.functional import multiclass_f1_score
from torchinfo import summary

import plotly.express as px
import plotly.graph_objects as go
import numpy as np
import pandas as pd
import copy
from tqdm import tqdm
import time
import os
from scipy import signal
from sklearn.model_selection import train_test_split
from sklearn.neighbors import KNeighborsClassifier
from sklearn.metrics import accuracy_score
from natsort import natsorted

In [2]:
# Pick the compute backend: CUDA first, then Apple MPS, otherwise the CPU.
if torch.cuda.is_available():
    device = "cuda"
elif torch.backends.mps.is_available():
    device = "mps"
else:
    device = "cpu"
print(f"Using {device} device")

Using cuda device


In [3]:
# Folders that hold the dataset
workspace = 'C:\\Meu Drive\\Doutorado Unicamp\\Projeto\\Dataset\\'
root = 'C:\\Meu Drive\\Doutorado Unicamp\\Projeto\\Dataset\\RealWorld\\'

# Users: the entries found directly under `root`, in natural sort order
users = natsorted(os.listdir(root))

# Activity names
tarefas = [
    'climbingdown',
    'climbingup',
    'jumping',
    'lying',
    'running',
    'sitting',
    'standing',
    'walking',
]
# Subset of `tarefas` without 'jumping' and 'lying'
SAC = [
    'sitting',
    'standing',
    'walking',
    'climbingup',
    'climbingdown',
    'running',
]

# Sensor positions, and their Portuguese labels listed in the same order
posicao = [
    'chest',
    'forearm',
    'head',
    'shin',
    'thigh',
    'upperarm',
    'waist',
]
posicaopt = [
    'peito',
    'antebraço',
    'cabeça',
    'canela',
    'coxa',
    'braço',
    'cintura',
]

In [4]:
# Load one DataFrame per sensor position, in the same order as `posicao`,
# so that D[k] is the view read from '<posicao[k]>_nova50hz.csv'.
# Iterating over `posicao` replaces seven copy-pasted read_csv calls and keeps
# the list length tied to the number of positions instead of a hard-coded 7.
pasta = 'C:\\Meu Drive\\Doutorado Unicamp\\Projeto\\Dataset\\realworld views\\'
D = [pd.read_csv(pasta + nome + '_nova50hz.csv') for nome in posicao]

# Definição dos dados e modelos

In [5]:
# Features: the first 450 columns of the chest view (D[0] is read from posicao[0]), divided by 30.
# Labels: the third column counted from the end.
# NOTE(review): the meaning of the 450 columns and of the 1/30 scale is not visible here — confirm.
X = D[0].values[:, :450] / 30
y = D[0].values[:, -3]

# Stratified split: 20% held out for test, then 10% of the remaining part held out for validation.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=1, stratify=y
)
X_train, X_val, y_train, y_val = train_test_split(
    X_train, y_train, test_size=0.1, random_state=1, stratify=y_train
)

# Turn the three feature matrices into float32 tensors on the selected device
# (the label arrays are left as returned by train_test_split).
X_train, X_test, X_val = (
    torch.tensor(split, dtype=torch.float32, device=device).detach()
    for split in (X_train, X_test, X_val)
)

In [6]:
class automlpacc(nn.Module):
    """Single-hidden-layer MLP autoencoder.

    The encoder flattens every sample, applies one linear layer down (or up)
    to ``dim`` units and a Tanh; the decoder is a single linear layer mapping
    the ``dim``-sized code back to ``raw_dim`` values.

    Args:
        dim: size of the latent code produced by ``encoder``.
        raw_dim: number of values per flattened input sample. Defaults to 450,
            the value that used to be hard-coded, so ``automlpacc(dim)`` builds
            exactly the same network as before.
    """

    def __init__(self, dim, raw_dim=450):
        super().__init__()
        # Layer order and attribute names are kept so state_dict keys
        # ('encoder.1.*', 'decoder.*') stay compatible.
        self.encoder = nn.Sequential(
            nn.Flatten(start_dim=1),
            nn.Linear(raw_dim, dim),
            nn.Tanh(),
        )
        self.decoder = nn.Linear(dim, raw_dim)

    def forward(self, x):
        """Encode ``x`` and return its linear reconstruction of shape (batch, raw_dim)."""
        return self.decoder(self.encoder(x))

In [161]:
class automlp(nn.Module):
    """One-hidden-layer MLP autoencoder for 900-value inputs with a 600-unit Tanh code."""

    def __init__(self):
        super().__init__()
        raw_dim, dim = 900, 600
        # Encoder: flatten each sample, project to the code size, squash with Tanh.
        flatten = nn.Flatten(start_dim=1)
        project = nn.Linear(raw_dim, dim)
        self.encoder = nn.Sequential(flatten, project, nn.Tanh())
        # Decoder: a single linear map back to the input size.
        self.decoder = nn.Linear(dim, raw_dim)

    def forward(self, x):
        """Return the reconstruction of ``x`` (decoder applied to the encoder output)."""
        code = self.encoder(x)
        return self.decoder(code)

In [137]:
class automlp2(nn.Module):
    """Two-hidden-layer MLP autoencoder (900 -> 600 -> 600 -> 600 -> 900) with Tanh activations.

    Note: a later cell of this notebook defines another class named ``automlp2``
    taking ``(dim1, dim2)``; once that cell has run, it replaces this definition.
    """

    def __init__(self):
        super().__init__()
        raw_dim, dim1, dim2 = 900, 600, 600
        encoder_layers = [
            nn.Flatten(start_dim=1),
            nn.Linear(raw_dim, dim1),
            nn.Tanh(),
            nn.Linear(dim1, dim2),
            nn.Tanh(),
        ]
        decoder_layers = [
            nn.Linear(dim2, dim1),
            nn.Tanh(),
            nn.Linear(dim1, raw_dim),
        ]
        # Encoder and decoder live in one Sequential, in this exact order.
        self.all_layers = nn.Sequential(*encoder_layers, *decoder_layers)

    def forward(self, x):
        """Run ``x`` through every layer and return the reconstruction."""
        return self.all_layers(x)

In [52]:
# Stand-alone autoencoder used for the torchinfo summary.
# automlpacc requires the latent size as its first argument (calling it with no
# arguments raises TypeError); 100 is the size shown in the recorded summary
# output of this notebook (Linear 450 -> 100).
model = automlpacc(100).to(device)
loss_fn = nn.MSELoss()
optimizer = optim.Adam(model.parameters(), lr=0.001)
n_epochs = 20   # number of epochs to run
batch_size = 150  # size of each batch
# Start index of every mini-batch inside X_train
batch_start = torch.arange(0, len(X_train), batch_size)
trainLoss = []
valLoss = []

In [64]:
# Show the torchinfo summary of `model` for an input of shape (batch_size, 450).
summary(model, input_size=(batch_size, 450))

Layer (type:depth-idx)                   Output Shape              Param #
automlpacc                               [150, 450]                --
├─Sequential: 1-1                        [150, 100]                --
│    └─Flatten: 2-1                      [150, 450]                --
│    └─Linear: 2-2                       [150, 100]                45,100
│    └─Tanh: 2-3                         [150, 100]                --
├─Linear: 1-2                            [150, 450]                45,450
Total params: 90,550
Trainable params: 90,550
Non-trainable params: 0
Total mult-adds (Units.MEGABYTES): 13.58
Input size (MB): 0.27
Forward/backward pass size (MB): 0.66
Params size (MB): 0.36
Estimated Total Size (MB): 1.29

# Treinamento de modelos automlp de uma camada

In [7]:
# Latent sizes to sweep, and one (initially empty) model slot per size.
lat_dim = [10, 20, 30, 50, 70, 100, 150, 200, 250, 300, 350, 400]
models1 = [None for _ in lat_dim]

In [8]:
# Train one automlpacc autoencoder per latent size in `lat_dim` (stored in
# models1[i]) and plot its train/validation reconstruction MSE per epoch.

# Settings shared by every model (hoisted out of the loop: they do not depend on `dim`).
loss_fn = nn.MSELoss()
n_epochs = 20   # number of epochs to run
batch_size = 150  # size of each batch
batch_start = torch.arange(0, len(X_train), batch_size)

for i, dim in enumerate(lat_dim):
    models1[i] = automlpacc(dim).to(device)
    optimizer = optim.Adam(models1[i].parameters(), lr=0.001)
    trainLoss = []
    valLoss = []
    for epoch in range(n_epochs):
        models1[i].train()
        with tqdm(batch_start, unit="batch", mininterval=0, disable=False) as bar:
            bar.set_description(f"Epoch {epoch}")
            for start in bar:
                # take a batch
                X_batch = X_train[start:start+batch_size,:]
                # forward pass: the autoencoder is trained to reproduce its own input
                Xh = models1[i](X_batch)
                loss = loss_fn(Xh, X_batch)
                # backward pass
                optimizer.zero_grad()
                loss.backward()
                # update weights
                optimizer.step()
                # print progress
                bar.set_postfix(loss=float(loss))
        # evaluate the reconstruction loss at the end of each epoch;
        # no_grad avoids building an autograd graph over the full train/val sets
        models1[i].eval()
        with torch.no_grad():
            Xh = models1[i](X_val)
            valLoss.append(float(loss_fn(Xh, X_val)))
            Xh = models1[i](X_train)
            trainLoss.append(float(loss_fn(Xh, X_train)))
    # learning curves of the model that was just trained
    fig = go.Figure()
    fig.add_trace(go.Scatter(y=valLoss, mode="lines", showlegend=True, name='validação'))
    fig.add_trace(go.Scatter(y=trainLoss, mode="lines", showlegend=True, name='treino'))
    fig.show()

Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 178.49batch/s, loss=0.00715]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 214.78batch/s, loss=0.00471]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 238.27batch/s, loss=0.00449]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 243.69batch/s, loss=0.00435]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 224.00batch/s, loss=0.00417]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 220.14batch/s, loss=0.00397]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 222.22batch/s, loss=0.00378]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 206.61batch/s, loss=0.00363]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 222.70batch/s, loss=0.00351]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 211.26batch/s, loss=0.00342]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 185.66batch/s, loss=0.00336]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 233.93batch/s, loss=0.00331]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 230.89batch/s, loss=0.003

Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 215.99batch/s, loss=0.00481]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 209.45batch/s, loss=0.00393]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 230.00batch/s, loss=0.00338]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 167.79batch/s, loss=0.00312]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 143.90batch/s, loss=0.00293]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 190.00batch/s, loss=0.00277]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 173.19batch/s, loss=0.00264]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 168.65batch/s, loss=0.00257]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 166.88batch/s, loss=0.00253]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 174.76batch/s, loss=0.0025] 
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 178.74batch/s, loss=0.00249]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 179.51batch/s, loss=0.00248]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 176.92batch/s, loss=0.002

Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 154.00batch/s, loss=0.00407]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 187.76batch/s, loss=0.00319]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 163.47batch/s, loss=0.00283]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 209.18batch/s, loss=0.00261]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 175.62batch/s, loss=0.00248]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 185.60batch/s, loss=0.00239]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 179.79batch/s, loss=0.00233]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 212.80batch/s, loss=0.00229]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 234.49batch/s, loss=0.00225]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 187.83batch/s, loss=0.00223]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 206.35batch/s, loss=0.00221]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 209.50batch/s, loss=0.00219]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 207.74batch/s, loss=0.002

Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 208.11batch/s, loss=0.0032] 
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 221.31batch/s, loss=0.00246]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 234.13batch/s, loss=0.00211]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 229.04batch/s, loss=0.00192]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 220.77batch/s, loss=0.0018] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 246.32batch/s, loss=0.00172]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 244.71batch/s, loss=0.00165]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 229.89batch/s, loss=0.00161]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 231.15batch/s, loss=0.00157]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 246.03batch/s, loss=0.00155]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 205.27batch/s, loss=0.00154]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 191.68batch/s, loss=0.00153]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 191.84batch/s, loss=0.001

Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 191.32batch/s, loss=0.00279]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 200.92batch/s, loss=0.0021] 
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 211.35batch/s, loss=0.00178]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 184.22batch/s, loss=0.00158]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 200.62batch/s, loss=0.00144]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 189.32batch/s, loss=0.00133]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 197.96batch/s, loss=0.00125]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 201.76batch/s, loss=0.00119]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 193.23batch/s, loss=0.00115]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 181.39batch/s, loss=0.00112]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 189.61batch/s, loss=0.00109]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 193.70batch/s, loss=0.00108]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 199.83batch/s, loss=0.001

Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 167.38batch/s, loss=0.00235]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 174.91batch/s, loss=0.00168]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 180.43batch/s, loss=0.00132]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 124.95batch/s, loss=0.00107]
Epoch 4: 100%|██████████| 109/109 [00:02<00:00, 37.83batch/s, loss=0.000908]
Epoch 5: 100%|██████████| 109/109 [00:01<00:00, 76.99batch/s, loss=0.000804]
Epoch 6: 100%|██████████| 109/109 [00:01<00:00, 75.63batch/s, loss=0.000738]
Epoch 7: 100%|██████████| 109/109 [00:01<00:00, 95.48batch/s, loss=0.000694] 
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 216.68batch/s, loss=0.000665]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 235.59batch/s, loss=0.000644]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 213.06batch/s, loss=0.000628]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 236.67batch/s, loss=0.000617]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 201.79batch/s, loss=

Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 198.32batch/s, loss=0.00196]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 185.97batch/s, loss=0.00115]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 186.62batch/s, loss=0.000777]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 168.90batch/s, loss=0.000572]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 169.89batch/s, loss=0.000465]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 177.98batch/s, loss=0.000406]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 166.99batch/s, loss=0.00037] 
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 182.39batch/s, loss=0.000346]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 165.27batch/s, loss=0.000329]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 170.18batch/s, loss=0.000317]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 171.34batch/s, loss=0.000308]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 179.14batch/s, loss=0.000303]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 182.77batch/s, 

Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 184.02batch/s, loss=0.00163]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 171.30batch/s, loss=0.00086]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 172.14batch/s, loss=0.000526]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 175.42batch/s, loss=0.000365]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 180.65batch/s, loss=0.000279]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 167.39batch/s, loss=0.000233]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 181.56batch/s, loss=0.000206]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 181.95batch/s, loss=0.00019] 
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 180.86batch/s, loss=0.00018] 
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 167.08batch/s, loss=0.000174]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 175.23batch/s, loss=0.000171]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 173.09batch/s, loss=0.00017] 
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 173.84batch/s, 

Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 164.00batch/s, loss=0.00139]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 208.58batch/s, loss=0.000666]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 221.47batch/s, loss=0.000381]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 217.09batch/s, loss=0.000249]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 222.05batch/s, loss=0.000182]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 181.46batch/s, loss=0.000144]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 230.49batch/s, loss=0.000123]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 227.01batch/s, loss=0.00011] 
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 213.16batch/s, loss=0.000102]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 223.09batch/s, loss=0.000101]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 208.03batch/s, loss=9.36e-5] 
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 198.56batch/s, loss=8.9e-5]  
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 155.24batch/s,

Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 170.22batch/s, loss=0.00133]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 184.70batch/s, loss=0.000543]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 181.53batch/s, loss=0.000285]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 156.29batch/s, loss=0.000184]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 146.30batch/s, loss=0.000133]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 160.37batch/s, loss=0.000106]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 163.71batch/s, loss=8.91e-5] 
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 156.09batch/s, loss=7.8e-5]  
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 151.57batch/s, loss=7.14e-5] 
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 158.75batch/s, loss=6.71e-5] 
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 147.33batch/s, loss=6.04e-5] 
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 152.63batch/s, loss=6.01e-5] 
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 142.51batch/s,

Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 171.06batch/s, loss=0.00109]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 162.85batch/s, loss=0.000406]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 185.18batch/s, loss=0.000207]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 181.09batch/s, loss=0.000129]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 185.29batch/s, loss=9.16e-5]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 235.61batch/s, loss=6.95e-5] 
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 229.75batch/s, loss=5.46e-5]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 243.49batch/s, loss=4.46e-5]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 224.33batch/s, loss=3.8e-5]  
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 167.41batch/s, loss=3.86e-5] 
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 162.61batch/s, loss=3.22e-5] 
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 178.97batch/s, loss=3.14e-5] 
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 169.11batch/s, lo

Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 174.33batch/s, loss=0.000995]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 172.39batch/s, loss=0.000337]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 171.46batch/s, loss=0.000165]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 172.08batch/s, loss=9.97e-5] 
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 175.66batch/s, loss=7.05e-5] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 162.75batch/s, loss=5.4e-5]  
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 176.29batch/s, loss=4.34e-5] 
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 171.22batch/s, loss=3.7e-5]  
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 163.01batch/s, loss=3.45e-5] 
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 135.69batch/s, loss=2.73e-5] 
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 138.26batch/s, loss=2.69e-5] 
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 152.43batch/s, loss=2.22e-5]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 168.76batch/s,

In [9]:
# Final validation reconstruction MSE of every first-stage model, shown as a bar chart.
valLoss = []
# Pure inference: no_grad skips autograd bookkeeping for these forward passes.
with torch.no_grad():
    for model in models1:
        model.eval()
        Xh = model(X_val)
        valLoss.append(float(loss_fn(Xh, X_val)))
px.bar(x=lat_dim, y=valLoss, title='MSE de reconstrução por dimensão', labels={'y':'MSE', 'x':'Dimensão'}, width=1000)

In [10]:
# Overlay one validation sample with its reconstruction by every first-stage model.
aux = X_val.cpu().detach().numpy()
i = 12  # index of the validation sample to plot
print(tarefas[int(y_val[i])])
fig = go.Figure()
fig.add_trace(go.Scatter(y=aux[i,:], mode="lines", showlegend=True, name='original'))
# models1[k] was built with lat_dim[k], so zip pairs each model with its latent
# size directly instead of searching the list with models1.index(model).
with torch.no_grad():
    for dim, model in zip(lat_dim, models1):
        Xh = model(X_val).cpu().numpy()
        fig.add_trace(go.Scatter(y=Xh[i,:], mode="lines", showlegend=True, name='reconstrução '+str(dim)))
fig.show()

running


# Treinamento de modelos a partir do espaço latente dos automlp

In [11]:
# Latent codes of the train and validation sets for every first-stage model:
# emb_train[i] / emb_val[i] are the encoder outputs of models1[i].
emb_train = [None] * len(lat_dim)
emb_val = [None] * len(lat_dim)
# no_grad: the codes are only used as fixed inputs, so no autograd graph is
# built over the whole training set (the tensors come out already detached).
with torch.no_grad():
    for i, model in enumerate(models1):
        emb_train[i] = model.encoder(X_train)
        emb_val[i] = model.encoder(X_val)

In [12]:
# Latent sizes for the second-stage sweep, and one (initially empty) model slot per size.
lat_dim = [10, 20, 30, 50, 70, 100, 150, 200, 250, 300, 350, 400]
models2 = [None for _ in lat_dim]

In [13]:
class automlp2(nn.Module):
    """Single-hidden-layer MLP autoencoder mapping ``dim1`` inputs to a ``dim2`` code and back.

    Args:
        dim1: number of values per flattened input sample (also the output size).
        dim2: size of the Tanh-activated code produced by ``encoder``.
    """

    def __init__(self, dim1, dim2):
        super().__init__()
        # Encoder: flatten, linear dim1 -> dim2, Tanh.
        encoder_layers = (
            nn.Flatten(start_dim=1),
            nn.Linear(dim1, dim2),
            nn.Tanh(),
        )
        self.encoder = nn.Sequential(*encoder_layers)
        # Decoder: linear dim2 -> dim1, no activation.
        self.decoder = nn.Linear(dim2, dim1)

    def forward(self, x):
        """Return the reconstruction of ``x`` with shape (batch, dim1)."""
        code = self.encoder(x)
        return self.decoder(code)

In [15]:
# Second-stage sweep: for every first-stage latent size dim1 = lat_dim[i], train
# one automlp2(dim1, dim2) autoencoder on the first-stage codes for every
# dim2 = lat_dim[j]. lossMat[j, i] holds the final validation MSE of that pair
# (rows follow dim2, columns follow dim1).
lossMat = np.zeros((len(lat_dim), len(lat_dim)))

# Settings shared by every run (hoisted: they do not depend on dim1/dim2).
loss_fn = nn.MSELoss()
n_epochs = 20   # number of epochs to run
batch_size = 150  # size of each batch

for i, dim1 in enumerate(lat_dim):
    # NOTE(review): these rebindings replace the raw-signal X_train / X_val with
    # embeddings, so earlier cells that use them (first-stage evaluation, the
    # reconstruction plot, the embedding extraction) no longer work if re-run
    # after this cell. The names are kept in case later cells rely on this.
    X_train = emb_train[i]
    X_val = emb_val[i]
    batch_start = torch.arange(0, len(X_train), batch_size)
    for j, dim2 in enumerate(lat_dim):
        print(dim1,dim2)
        # models2 is reused for every dim1: after the sweep it only holds the
        # models trained for the last dim1.
        models2[j] = automlp2(dim1, dim2).to(device)
        optimizer = optim.Adam(models2[j].parameters(), lr=0.001)
        trainLoss = []
        valLoss = []
        for epoch in range(n_epochs):
            models2[j].train()
            with tqdm(batch_start, unit="batch", mininterval=0, disable=False) as bar:
                bar.set_description(f"Epoch {epoch}")
                for start in bar:
                    # take a batch
                    X_batch = X_train[start:start+batch_size,:]
                    # forward pass: reconstruct the first-stage codes
                    Xh = models2[j](X_batch)
                    loss = loss_fn(Xh, X_batch)
                    # backward pass
                    optimizer.zero_grad()
                    loss.backward()
                    # update weights
                    optimizer.step()
                    # print progress
                    bar.set_postfix(loss=float(loss))
            # evaluate the reconstruction loss at the end of each epoch;
            # no_grad avoids building an autograd graph over the full sets
            models2[j].eval()
            with torch.no_grad():
                Xh = models2[j](X_val)
                valLoss.append(float(loss_fn(Xh, X_val)))
                Xh = models2[j](X_train)
                trainLoss.append(float(loss_fn(Xh, X_train)))
    # final validation MSE of every dim2 model trained for this dim1
    valLoss = []
    with torch.no_grad():
        for model in models2:
            model.eval()
            Xh = model(X_val)
            valLoss.append(float(loss_fn(Xh, X_val)))
    lossMat[:,i] = np.array(valLoss)
    # px.bar(x=lat_dim, y=valLoss, title='MSE de reconstrução por dimensão', labels={'y':'MSE', 'x':'Dimensão'}, width=1000)

10 10


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 235.99batch/s, loss=0.00922]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 200.05batch/s, loss=0.00585]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 243.54batch/s, loss=0.00458]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 226.00batch/s, loss=0.00364]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 223.00batch/s, loss=0.00293]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 225.56batch/s, loss=0.00233]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 239.75batch/s, loss=0.00183]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 229.90batch/s, loss=0.00143]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 244.63batch/s, loss=0.00114]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 257.86batch/s, loss=0.000915]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 251.74batch/s, loss=0.000731]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 248.99batch/s, loss=0.000568]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 254.72batch/s, loss=0.

10 20


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 274.33batch/s, loss=0.00386]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 268.05batch/s, loss=0.00197]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 260.39batch/s, loss=0.000802]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 214.62batch/s, loss=0.000315]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 198.46batch/s, loss=0.000146]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 204.80batch/s, loss=7.7e-5]  
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 189.56batch/s, loss=4.93e-5] 
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 201.16batch/s, loss=3.82e-5]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 205.38batch/s, loss=3.33e-5]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 213.36batch/s, loss=3.04e-5]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 191.62batch/s, loss=2.82e-5]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 209.32batch/s, loss=2.62e-5]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 213.30batch/s, loss=

10 30


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 206.97batch/s, loss=0.00401]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 213.43batch/s, loss=0.00198]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 202.72batch/s, loss=0.000654]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 212.21batch/s, loss=0.000216]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 214.94batch/s, loss=9.48e-5] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 203.61batch/s, loss=5e-5]    
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 208.81batch/s, loss=3.37e-5]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 218.61batch/s, loss=2.71e-5]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 177.24batch/s, loss=2.35e-5]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 176.55batch/s, loss=2.1e-5] 
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 171.35batch/s, loss=1.92e-5]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 192.26batch/s, loss=1.76e-5]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 182.88batch/s, loss=1

10 50


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 182.58batch/s, loss=0.00189]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 192.14batch/s, loss=0.000468]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 183.27batch/s, loss=0.000106]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 156.42batch/s, loss=3.65e-5]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 179.74batch/s, loss=1.98e-5]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 170.02batch/s, loss=1.47e-5]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 201.01batch/s, loss=1.19e-5]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 208.38batch/s, loss=9.7e-6] 
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 179.15batch/s, loss=7.95e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 204.13batch/s, loss=6.56e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 198.98batch/s, loss=5.49e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 169.22batch/s, loss=4.7e-6] 
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 165.87batch/s, loss=4.0

10 70


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 196.81batch/s, loss=0.00144]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 207.98batch/s, loss=0.000243]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 208.63batch/s, loss=6.02e-5] 
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 204.07batch/s, loss=2.46e-5]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 203.70batch/s, loss=1.75e-5]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 186.24batch/s, loss=1.38e-5]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 184.59batch/s, loss=1.09e-5]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 177.81batch/s, loss=8.33e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 165.98batch/s, loss=6.46e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 170.21batch/s, loss=5.11e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 173.44batch/s, loss=4.14e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 177.03batch/s, loss=3.44e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 173.88batch/s, loss=2.9

10 100


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 194.83batch/s, loss=0.000796]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 197.22batch/s, loss=0.000131]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 187.32batch/s, loss=2.54e-5]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 175.42batch/s, loss=1.14e-5]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 175.91batch/s, loss=8.33e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 185.53batch/s, loss=6.42e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 179.69batch/s, loss=4.91e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 188.04batch/s, loss=3.74e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 178.97batch/s, loss=2.84e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 184.70batch/s, loss=2.17e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 181.41batch/s, loss=1.7e-6] 
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 181.83batch/s, loss=1.39e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 179.95batch/s, loss=1.1

10 150


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 188.90batch/s, loss=0.00064] 
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 195.20batch/s, loss=4.45e-5]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 207.86batch/s, loss=1.66e-5]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 197.79batch/s, loss=1.25e-5]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 191.98batch/s, loss=9.87e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 205.01batch/s, loss=7.67e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 206.10batch/s, loss=5.78e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 198.69batch/s, loss=4.33e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 195.06batch/s, loss=3.27e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 201.91batch/s, loss=2.51e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 186.72batch/s, loss=2.09e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 198.38batch/s, loss=1.75e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 187.62batch/s, loss=1.55

10 200


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 211.11batch/s, loss=0.00014] 
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 200.71batch/s, loss=1.42e-5]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 208.03batch/s, loss=7.3e-6] 
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 205.17batch/s, loss=4.69e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 205.54batch/s, loss=3.15e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 206.01batch/s, loss=2.34e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 212.22batch/s, loss=1.88e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 212.66batch/s, loss=1.64e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 194.65batch/s, loss=1.53e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 214.62batch/s, loss=1.42e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 194.92batch/s, loss=1.27e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 200.73batch/s, loss=1.31e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 211.61batch/s, loss=1.45

10 250


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 209.59batch/s, loss=0.000106]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 209.71batch/s, loss=1.2e-5] 
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 211.05batch/s, loss=7.27e-6]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 197.54batch/s, loss=4.72e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 199.56batch/s, loss=3.13e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 217.56batch/s, loss=2.26e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 201.56batch/s, loss=1.74e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 207.11batch/s, loss=1.44e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 205.44batch/s, loss=1.21e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 211.52batch/s, loss=1.09e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 199.74batch/s, loss=1.07e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 197.46batch/s, loss=1.2e-6] 
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 213.05batch/s, loss=9.88

10 300


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 155.85batch/s, loss=8.61e-5] 
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 194.02batch/s, loss=1.66e-5]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 198.85batch/s, loss=9.24e-6]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 188.75batch/s, loss=5.68e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 212.66batch/s, loss=3.63e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 209.64batch/s, loss=2.45e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 197.80batch/s, loss=1.73e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 204.73batch/s, loss=1.33e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 199.72batch/s, loss=1.08e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 208.26batch/s, loss=1.06e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 203.21batch/s, loss=1.05e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 199.40batch/s, loss=8.24e-7]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 206.80batch/s, loss=7.77

10 350


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 202.58batch/s, loss=7.14e-5] 
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 218.77batch/s, loss=1.15e-5]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 202.72batch/s, loss=6.41e-6]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 217.22batch/s, loss=3.39e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 205.77batch/s, loss=1.9e-6] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 211.28batch/s, loss=1.21e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 204.14batch/s, loss=9.12e-7]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 192.54batch/s, loss=7.36e-7]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 211.89batch/s, loss=6.91e-7]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 201.98batch/s, loss=7.01e-7]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 209.61batch/s, loss=7.48e-7]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 203.20batch/s, loss=6.79e-7]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 214.22batch/s, loss=7.52

10 400


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 203.67batch/s, loss=4.14e-5] 
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 205.20batch/s, loss=9.6e-6] 
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 210.71batch/s, loss=5.08e-6]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 206.57batch/s, loss=2.73e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 209.70batch/s, loss=1.73e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 201.05batch/s, loss=1.31e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 213.92batch/s, loss=1.08e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 200.78batch/s, loss=8.85e-7]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 203.27batch/s, loss=8.05e-7]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 207.64batch/s, loss=7.77e-7]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 193.01batch/s, loss=1.41e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 209.72batch/s, loss=8.27e-7]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 191.93batch/s, loss=9.37

20 10


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 210.56batch/s, loss=0.0093]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 203.69batch/s, loss=0.00651]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 209.38batch/s, loss=0.00522]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 209.22batch/s, loss=0.00407]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 195.25batch/s, loss=0.00327]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 205.48batch/s, loss=0.00281]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 212.14batch/s, loss=0.00251]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 204.74batch/s, loss=0.00231]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 199.87batch/s, loss=0.00217]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 199.93batch/s, loss=0.00207]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 200.45batch/s, loss=0.002]  
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 202.05batch/s, loss=0.00194]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 196.31batch/s, loss=0.0019

20 20


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 207.95batch/s, loss=0.00529]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 200.18batch/s, loss=0.003]  
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 204.00batch/s, loss=0.00181]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 205.95batch/s, loss=0.00131]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 212.95batch/s, loss=0.00101]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 199.91batch/s, loss=0.000794]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 204.29batch/s, loss=0.000634]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 206.64batch/s, loss=0.000504]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 189.57batch/s, loss=0.000394]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 206.10batch/s, loss=0.000303]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 206.35batch/s, loss=0.000227]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 198.18batch/s, loss=0.000165]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 207.44batch/s, los

20 30


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 196.66batch/s, loss=0.00491]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 211.93batch/s, loss=0.00245]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 200.10batch/s, loss=0.00126]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 204.56batch/s, loss=0.000701]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 212.69batch/s, loss=0.000397]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 197.82batch/s, loss=0.000227]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 208.74batch/s, loss=0.000133]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 203.81batch/s, loss=8.19e-5] 
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 202.61batch/s, loss=5.27e-5] 
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 211.57batch/s, loss=3.61e-5]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 194.80batch/s, loss=2.74e-5]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 197.38batch/s, loss=2.29e-5]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 207.92batch/s, loss

20 50


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 197.41batch/s, loss=0.0028] 
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 198.19batch/s, loss=0.000992]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 205.77batch/s, loss=0.000386]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 200.33batch/s, loss=0.000144]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 210.15batch/s, loss=5.67e-5] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 199.67batch/s, loss=2.84e-5]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 216.25batch/s, loss=1.87e-5]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 202.64batch/s, loss=1.42e-5]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 209.28batch/s, loss=1.15e-5]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 195.57batch/s, loss=9.45e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 206.53batch/s, loss=7.87e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 214.58batch/s, loss=6.58e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 194.53batch/s, loss=5

20 70


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 205.78batch/s, loss=0.00209]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 209.85batch/s, loss=0.000626]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 192.01batch/s, loss=0.000218]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 217.27batch/s, loss=7.41e-5] 
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 203.17batch/s, loss=3.03e-5]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 209.66batch/s, loss=1.81e-5]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 198.52batch/s, loss=1.34e-5]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 208.98batch/s, loss=1.03e-5]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 209.95batch/s, loss=7.93e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 204.26batch/s, loss=6.05e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 200.09batch/s, loss=4.59e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 210.90batch/s, loss=3.53e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 201.55batch/s, loss=2.

20 100


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 187.17batch/s, loss=0.00117]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 192.07batch/s, loss=0.000199]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 224.25batch/s, loss=4.86e-5]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 200.51batch/s, loss=2.42e-5]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 206.00batch/s, loss=1.68e-5]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 206.01batch/s, loss=1.21e-5]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 209.03batch/s, loss=8.71e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 200.78batch/s, loss=6.27e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 200.38batch/s, loss=4.6e-6] 
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 195.94batch/s, loss=3.51e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 194.41batch/s, loss=2.86e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 195.45batch/s, loss=2.49e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 204.49batch/s, loss=2.26

20 150


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 199.56batch/s, loss=0.000578]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 220.98batch/s, loss=7.62e-5] 
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 200.92batch/s, loss=2.26e-5]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 203.78batch/s, loss=1.11e-5]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 217.32batch/s, loss=7.25e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 203.41batch/s, loss=4.65e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 159.31batch/s, loss=2.97e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 169.81batch/s, loss=2.07e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 176.61batch/s, loss=1.64e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 196.68batch/s, loss=1.44e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 205.98batch/s, loss=1.36e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 207.88batch/s, loss=1.34e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 188.73batch/s, loss=1.3

20 200


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 212.14batch/s, loss=0.000271]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 201.27batch/s, loss=3.38e-5]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 204.53batch/s, loss=1.27e-5]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 196.29batch/s, loss=6.8e-6] 
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 201.44batch/s, loss=3.71e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 204.60batch/s, loss=2.23e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 189.22batch/s, loss=1.63e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 205.03batch/s, loss=1.41e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 208.04batch/s, loss=1.37e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 201.84batch/s, loss=1.34e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 191.03batch/s, loss=1.25e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 181.34batch/s, loss=1.23e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 182.26batch/s, loss=1.26

20 250


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 202.46batch/s, loss=0.000215]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 196.43batch/s, loss=2.4e-5] 
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 198.26batch/s, loss=7.3e-6] 
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 200.55batch/s, loss=3.21e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 200.84batch/s, loss=1.77e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 203.49batch/s, loss=1.26e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 196.95batch/s, loss=1.07e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 212.25batch/s, loss=1.02e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 179.16batch/s, loss=1e-6]   
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 201.71batch/s, loss=9.93e-7]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 192.88batch/s, loss=9.9e-7] 
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 204.48batch/s, loss=9.69e-7]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 205.83batch/s, loss=9.59

20 300


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 199.42batch/s, loss=0.000194]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 204.76batch/s, loss=2.58e-5]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 203.97batch/s, loss=8.95e-6]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 200.60batch/s, loss=4.5e-6] 
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 200.96batch/s, loss=2.45e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 200.09batch/s, loss=1.57e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 206.86batch/s, loss=1.22e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 195.39batch/s, loss=1.12e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 211.34batch/s, loss=1.07e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 206.05batch/s, loss=1.1e-6] 
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 197.34batch/s, loss=1.13e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 196.75batch/s, loss=1.07e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 210.60batch/s, loss=1.04

20 350


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 199.61batch/s, loss=6.83e-5] 
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 210.90batch/s, loss=1.18e-5]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 208.79batch/s, loss=5.01e-6]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 207.27batch/s, loss=2.09e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 206.32batch/s, loss=1.06e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 212.46batch/s, loss=8.04e-7]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 212.71batch/s, loss=7.95e-7]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 216.00batch/s, loss=7.97e-7]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 200.29batch/s, loss=7.38e-7]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 214.53batch/s, loss=7.3e-7] 
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 199.82batch/s, loss=8.63e-7]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 202.66batch/s, loss=9.03e-7]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 207.51batch/s, loss=1.02

20 400


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 210.83batch/s, loss=3.95e-5]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 208.78batch/s, loss=6.48e-6]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 203.86batch/s, loss=2.82e-6]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 213.71batch/s, loss=1.44e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 213.99batch/s, loss=1.09e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 204.87batch/s, loss=9.59e-7]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 210.27batch/s, loss=8.8e-7] 
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 213.14batch/s, loss=8.3e-7] 
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 197.17batch/s, loss=1.01e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 196.47batch/s, loss=8.81e-7]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 213.79batch/s, loss=1.04e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 215.03batch/s, loss=9.68e-7]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 202.31batch/s, loss=9.47e

30 10


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 208.00batch/s, loss=0.00851]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 188.61batch/s, loss=0.00619]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 202.71batch/s, loss=0.0057] 
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 198.57batch/s, loss=0.00548]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 210.20batch/s, loss=0.0053] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 208.78batch/s, loss=0.00511]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 206.70batch/s, loss=0.00489]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 198.78batch/s, loss=0.00465]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 211.57batch/s, loss=0.00441]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 207.66batch/s, loss=0.00421]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 205.09batch/s, loss=0.00403]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 215.64batch/s, loss=0.00387]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 191.45batch/s, loss=0.003

30 20


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 204.54batch/s, loss=0.00545]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 203.14batch/s, loss=0.00354]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 208.00batch/s, loss=0.00229]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 206.41batch/s, loss=0.00173]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 206.77batch/s, loss=0.0014] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 195.78batch/s, loss=0.00118]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 211.32batch/s, loss=0.00106]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 201.79batch/s, loss=0.000988]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 201.29batch/s, loss=0.000948]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 207.26batch/s, loss=0.000924]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 207.60batch/s, loss=0.000906]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 198.18batch/s, loss=0.000889]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 192.07batch/s, loss=

30 30


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 202.60batch/s, loss=0.00495]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 218.73batch/s, loss=0.00291]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 203.88batch/s, loss=0.00187]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 204.15batch/s, loss=0.00127]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 205.52batch/s, loss=0.000892]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 208.87batch/s, loss=0.000625]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 203.18batch/s, loss=0.000436]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 197.15batch/s, loss=0.000304]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 211.13batch/s, loss=0.000205]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 203.72batch/s, loss=0.000132]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 205.78batch/s, loss=8.08e-5] 
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 200.15batch/s, loss=4.93e-5] 
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 202.76batch/s, lo

30 50


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 216.02batch/s, loss=0.00363]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 201.49batch/s, loss=0.00151]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 196.41batch/s, loss=0.000741]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 201.93batch/s, loss=0.000348]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 192.28batch/s, loss=0.000128]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 191.50batch/s, loss=4.36e-5] 
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 197.74batch/s, loss=2.05e-5]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 210.55batch/s, loss=1.54e-5]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 203.61batch/s, loss=1.42e-5]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 202.59batch/s, loss=1.36e-5]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 208.73batch/s, loss=1.29e-5]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 205.83batch/s, loss=1.2e-5] 
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 199.97batch/s, loss=1

30 70


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 205.41batch/s, loss=0.00231]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 201.80batch/s, loss=0.000795]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 215.71batch/s, loss=0.00027] 
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 204.22batch/s, loss=8.6e-5]  
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 205.58batch/s, loss=2.81e-5]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 210.88batch/s, loss=1.34e-5]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 195.73batch/s, loss=9.48e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 210.86batch/s, loss=7.72e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 197.47batch/s, loss=6.47e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 212.63batch/s, loss=5.45e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 201.66batch/s, loss=4.64e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 206.82batch/s, loss=3.99e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 209.97batch/s, loss=3.

30 100


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 203.78batch/s, loss=0.00189]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 213.29batch/s, loss=0.000538]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 202.00batch/s, loss=0.000134]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 204.02batch/s, loss=2.52e-5]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 217.86batch/s, loss=8.29e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 198.52batch/s, loss=6.05e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 211.51batch/s, loss=5e-6]   
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 201.42batch/s, loss=4.14e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 211.77batch/s, loss=3.44e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 204.49batch/s, loss=2.9e-6] 
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 211.83batch/s, loss=2.5e-6] 
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 204.57batch/s, loss=2.21e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 209.12batch/s, loss=2.0

30 150


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 201.73batch/s, loss=0.00078] 
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 206.63batch/s, loss=9.55e-5] 
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 212.09batch/s, loss=1.48e-5]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 203.92batch/s, loss=8.12e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 208.10batch/s, loss=6.15e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 215.23batch/s, loss=4.58e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 207.83batch/s, loss=3.45e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 200.40batch/s, loss=2.71e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 215.16batch/s, loss=2.22e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 205.72batch/s, loss=1.92e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 210.37batch/s, loss=1.74e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 196.55batch/s, loss=1.62e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 210.48batch/s, loss=1.5

30 200


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 214.10batch/s, loss=0.000592]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 199.52batch/s, loss=6.3e-5]  
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 199.39batch/s, loss=1.19e-5]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 210.49batch/s, loss=7.05e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 212.21batch/s, loss=5.32e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 204.69batch/s, loss=3.92e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 204.40batch/s, loss=2.92e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 212.15batch/s, loss=2.27e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 217.84batch/s, loss=1.84e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 198.66batch/s, loss=1.58e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 215.93batch/s, loss=1.4e-6] 
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 212.93batch/s, loss=1.29e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 207.04batch/s, loss=1.2

30 250


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 211.67batch/s, loss=0.000338]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 206.80batch/s, loss=2.12e-5]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 209.69batch/s, loss=6.12e-6]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 197.97batch/s, loss=3.69e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 200.97batch/s, loss=2.41e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 212.24batch/s, loss=1.74e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 199.00batch/s, loss=1.38e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 212.26batch/s, loss=1.21e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 201.85batch/s, loss=1.15e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 206.43batch/s, loss=1.12e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 199.08batch/s, loss=1.11e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 203.80batch/s, loss=1.12e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 205.12batch/s, loss=1.11

30 300


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 198.96batch/s, loss=0.000181]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 218.08batch/s, loss=1.07e-5]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 209.15batch/s, loss=4.73e-6]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 204.37batch/s, loss=2.64e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 217.73batch/s, loss=1.66e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 202.53batch/s, loss=1.22e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 204.29batch/s, loss=1.03e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 203.28batch/s, loss=9.4e-7] 
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 210.72batch/s, loss=9.02e-7]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 199.73batch/s, loss=9.06e-7]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 199.79batch/s, loss=8.99e-7]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 205.12batch/s, loss=8.62e-7]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 190.99batch/s, loss=9.02

30 350


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 206.46batch/s, loss=0.000185]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 209.31batch/s, loss=9.98e-6]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 205.43batch/s, loss=4.15e-6]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 208.50batch/s, loss=2.28e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 207.14batch/s, loss=1.47e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 197.17batch/s, loss=1.13e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 200.05batch/s, loss=9.98e-7]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 214.34batch/s, loss=9.47e-7]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 201.12batch/s, loss=9.51e-7]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 202.68batch/s, loss=9.39e-7]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 204.35batch/s, loss=9.23e-7]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 211.41batch/s, loss=8.89e-7]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 197.20batch/s, loss=9.17

30 400


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 183.42batch/s, loss=9.32e-5] 
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 184.03batch/s, loss=7.04e-6]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 167.65batch/s, loss=3.51e-6]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 174.62batch/s, loss=1.92e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 178.66batch/s, loss=1.26e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 175.06batch/s, loss=9.99e-7]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 181.28batch/s, loss=8.98e-7]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 172.44batch/s, loss=8.41e-7]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 170.34batch/s, loss=8.81e-7]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 179.15batch/s, loss=8.64e-7]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 199.64batch/s, loss=8.95e-7]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 195.07batch/s, loss=9.55e-7]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 207.99batch/s, loss=9.4e

50 10


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 196.42batch/s, loss=0.00799]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 172.20batch/s, loss=0.00591]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 195.59batch/s, loss=0.00534]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 207.44batch/s, loss=0.00495]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 201.54batch/s, loss=0.0047] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 201.74batch/s, loss=0.00453]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 199.01batch/s, loss=0.00441]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 203.21batch/s, loss=0.00431]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 202.28batch/s, loss=0.00423]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 202.91batch/s, loss=0.00417]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 208.76batch/s, loss=0.00412]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 194.43batch/s, loss=0.00407]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 209.11batch/s, loss=0.004

50 20


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 205.28batch/s, loss=0.00517]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 205.98batch/s, loss=0.00392]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 200.18batch/s, loss=0.00321]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 206.62batch/s, loss=0.00282]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 204.32batch/s, loss=0.00267]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 211.34batch/s, loss=0.00261]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 202.05batch/s, loss=0.00258]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 204.70batch/s, loss=0.00255]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 208.97batch/s, loss=0.00253]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 197.76batch/s, loss=0.00252]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 207.90batch/s, loss=0.00251]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 201.94batch/s, loss=0.0025] 
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 204.45batch/s, loss=0.002

50 30


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 207.67batch/s, loss=0.00544]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 205.27batch/s, loss=0.00389]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 207.39batch/s, loss=0.00294]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 179.63batch/s, loss=0.00236]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 183.03batch/s, loss=0.00203]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 171.41batch/s, loss=0.00184]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 183.53batch/s, loss=0.00173]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 162.20batch/s, loss=0.00168]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 168.51batch/s, loss=0.00165]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 180.10batch/s, loss=0.00164]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 174.09batch/s, loss=0.00163]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 185.80batch/s, loss=0.00164]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 207.34batch/s, loss=0.001

50 50


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 211.30batch/s, loss=0.00359]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 200.25batch/s, loss=0.00173]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 214.91batch/s, loss=0.001]  
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 211.12batch/s, loss=0.000603]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 190.52batch/s, loss=0.000377]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 206.99batch/s, loss=0.000228]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 207.02batch/s, loss=0.00012] 
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 216.19batch/s, loss=7.38e-5] 
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 202.12batch/s, loss=5.02e-5] 
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 202.71batch/s, loss=3.28e-5]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 204.33batch/s, loss=2.27e-5]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 201.33batch/s, loss=1.97e-5]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 211.24batch/s, loss

50 70


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 209.02batch/s, loss=0.00308]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 214.84batch/s, loss=0.00142]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 200.21batch/s, loss=0.000686]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 209.65batch/s, loss=0.000285]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 213.23batch/s, loss=0.000102]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 214.01batch/s, loss=3.79e-5]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 202.41batch/s, loss=1.91e-5]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 206.65batch/s, loss=1.36e-5]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 199.09batch/s, loss=1.13e-5]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 189.29batch/s, loss=9.8e-6] 
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 208.22batch/s, loss=8.71e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 183.91batch/s, loss=7.86e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 208.98batch/s, loss=7.

50 100


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 212.73batch/s, loss=0.00236]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 200.00batch/s, loss=0.00075] 
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 200.36batch/s, loss=0.000236]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 204.58batch/s, loss=5.52e-5]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 190.22batch/s, loss=1.46e-5]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 181.09batch/s, loss=8.45e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 173.37batch/s, loss=6.42e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 172.41batch/s, loss=5.12e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 181.35batch/s, loss=4.22e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 171.08batch/s, loss=3.65e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 169.11batch/s, loss=3.33e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 163.89batch/s, loss=3.16e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 113.85batch/s, loss=3.0

50 150


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 177.32batch/s, loss=0.00127]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 181.21batch/s, loss=0.000185]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 170.43batch/s, loss=2.68e-5]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 182.06batch/s, loss=1.04e-5]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 177.91batch/s, loss=6.98e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 185.16batch/s, loss=4.85e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 194.71batch/s, loss=3.45e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 205.22batch/s, loss=2.65e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 209.19batch/s, loss=2.24e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 204.00batch/s, loss=2.05e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 201.08batch/s, loss=1.96e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 195.01batch/s, loss=1.9e-6] 
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 207.29batch/s, loss=1.85

50 200


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 178.75batch/s, loss=0.000967]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 189.49batch/s, loss=0.000121]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 184.04batch/s, loss=1.55e-5]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 187.41batch/s, loss=6.45e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 186.40batch/s, loss=3.86e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 176.17batch/s, loss=2.44e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 191.80batch/s, loss=1.71e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 201.70batch/s, loss=1.39e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 206.17batch/s, loss=1.28e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 194.45batch/s, loss=1.25e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 202.11batch/s, loss=1.24e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 210.82batch/s, loss=1.24e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 197.38batch/s, loss=1.2

50 250


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 174.70batch/s, loss=0.000649]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 209.33batch/s, loss=3.57e-5]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 206.07batch/s, loss=6.58e-6]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 201.61batch/s, loss=3.39e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 209.78batch/s, loss=1.93e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 197.61batch/s, loss=1.3e-6] 
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 214.52batch/s, loss=1.1e-6] 
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 195.63batch/s, loss=1.06e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 198.85batch/s, loss=1.06e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 202.83batch/s, loss=1.07e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 211.78batch/s, loss=1.07e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 193.45batch/s, loss=1.06e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 207.71batch/s, loss=1.04

50 300


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 168.61batch/s, loss=0.000408]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 179.92batch/s, loss=2.02e-5]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 173.79batch/s, loss=5.92e-6]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 179.33batch/s, loss=3.01e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 180.91batch/s, loss=1.68e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 164.21batch/s, loss=1.21e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 181.99batch/s, loss=1.08e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 174.30batch/s, loss=1.06e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 182.59batch/s, loss=1.07e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 173.65batch/s, loss=1.07e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 172.84batch/s, loss=1.08e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 170.26batch/s, loss=1.08e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 173.71batch/s, loss=1.09

50 350


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 179.63batch/s, loss=0.000299]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 177.17batch/s, loss=1.34e-5]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 179.64batch/s, loss=5.88e-6]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 170.44batch/s, loss=3.27e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 173.33batch/s, loss=2.06e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 166.13batch/s, loss=1.66e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 173.82batch/s, loss=1.51e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 208.03batch/s, loss=1.47e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 201.28batch/s, loss=1.47e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 207.32batch/s, loss=1.46e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 201.03batch/s, loss=1.45e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 205.05batch/s, loss=1.45e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 192.15batch/s, loss=1.42

50 400


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 211.62batch/s, loss=0.000191]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 193.46batch/s, loss=8.68e-6]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 206.92batch/s, loss=3.49e-6]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 206.42batch/s, loss=1.52e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 206.82batch/s, loss=1.01e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 194.66batch/s, loss=9.08e-7]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 207.31batch/s, loss=8.89e-7]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 210.68batch/s, loss=8.93e-7]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 201.81batch/s, loss=9.02e-7]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 195.75batch/s, loss=9.43e-7]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 213.65batch/s, loss=9.91e-7]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 204.77batch/s, loss=1.01e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 194.72batch/s, loss=9.92

70 10


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 204.13batch/s, loss=0.00794]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 211.12batch/s, loss=0.00646]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 207.12batch/s, loss=0.00608]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 203.82batch/s, loss=0.00579]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 201.52batch/s, loss=0.00555]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 201.55batch/s, loss=0.00538]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 208.27batch/s, loss=0.00525]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 203.89batch/s, loss=0.00514]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 197.20batch/s, loss=0.00504]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 211.01batch/s, loss=0.00496]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 201.23batch/s, loss=0.00489]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 200.31batch/s, loss=0.00484]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 206.32batch/s, loss=0.004

70 20


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 195.05batch/s, loss=0.00588]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 215.65batch/s, loss=0.00506]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 200.68batch/s, loss=0.00451]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 205.20batch/s, loss=0.00414]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 194.76batch/s, loss=0.00393]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 208.30batch/s, loss=0.0038] 
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 211.52batch/s, loss=0.00372]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 199.90batch/s, loss=0.00367]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 183.90batch/s, loss=0.00362]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 167.14batch/s, loss=0.00358]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 155.77batch/s, loss=0.00355]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 172.39batch/s, loss=0.00351]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 175.29batch/s, loss=0.003

70 30


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 166.57batch/s, loss=0.00535]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 167.75batch/s, loss=0.00377]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 181.58batch/s, loss=0.00318]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 194.80batch/s, loss=0.00293]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 197.53batch/s, loss=0.00281]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 213.00batch/s, loss=0.00274]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 199.07batch/s, loss=0.00271]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 209.93batch/s, loss=0.0027] 
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 194.73batch/s, loss=0.0027] 
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 208.50batch/s, loss=0.0027] 
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 211.85batch/s, loss=0.00271]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 195.11batch/s, loss=0.00271]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 204.62batch/s, loss=0.002

70 50


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 205.58batch/s, loss=0.00449]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 202.06batch/s, loss=0.00295]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 213.63batch/s, loss=0.00232]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 207.69batch/s, loss=0.00193]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 205.12batch/s, loss=0.0017] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 207.44batch/s, loss=0.00159]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 199.34batch/s, loss=0.00154] 
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 207.36batch/s, loss=0.0015]  
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 200.91batch/s, loss=0.00147] 
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 207.06batch/s, loss=0.00145] 
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 190.97batch/s, loss=0.00142] 
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 167.31batch/s, loss=0.0014]  
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 166.15batch/s, loss

70 70


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 207.87batch/s, loss=0.00364]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 197.64batch/s, loss=0.00188]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 211.14batch/s, loss=0.00115] 
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 212.65batch/s, loss=0.000703]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 214.41batch/s, loss=0.000396]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 197.76batch/s, loss=0.000212]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 208.28batch/s, loss=0.000116]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 212.64batch/s, loss=7.07e-5]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 201.89batch/s, loss=4.98e-5]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 205.97batch/s, loss=4.12e-5]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 210.01batch/s, loss=3.83e-5]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 203.40batch/s, loss=3.67e-5]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 211.46batch/s, loss=

70 100


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 175.52batch/s, loss=0.00271]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 174.87batch/s, loss=0.00113]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 187.28batch/s, loss=0.000474]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 174.48batch/s, loss=0.000174]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 180.52batch/s, loss=5.6e-5] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 178.38batch/s, loss=2.56e-5]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 191.45batch/s, loss=1.87e-5]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 173.67batch/s, loss=1.57e-5]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 177.52batch/s, loss=1.36e-5]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 177.30batch/s, loss=1.18e-5]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 197.12batch/s, loss=1.04e-5]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 199.72batch/s, loss=9.32e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 211.46batch/s, loss=8.4

70 150


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 203.73batch/s, loss=0.00187]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 202.19batch/s, loss=0.000485]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 210.36batch/s, loss=0.000107]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 206.90batch/s, loss=2.41e-5]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 211.81batch/s, loss=1.1e-5] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 191.90batch/s, loss=7.79e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 204.85batch/s, loss=5.83e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 200.69batch/s, loss=4.52e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 207.73batch/s, loss=3.76e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 202.03batch/s, loss=3.35e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 194.82batch/s, loss=3.14e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 203.87batch/s, loss=3.01e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 197.54batch/s, loss=2.9

70 200


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 163.68batch/s, loss=0.00125]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 182.48batch/s, loss=0.000193]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 184.73batch/s, loss=2.65e-5]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 179.96batch/s, loss=1.07e-5]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 206.11batch/s, loss=6.71e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 197.53batch/s, loss=4.4e-6] 
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 209.62batch/s, loss=3.21e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 199.81batch/s, loss=2.69e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 203.47batch/s, loss=2.45e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 198.75batch/s, loss=2.32e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 206.16batch/s, loss=2.22e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 201.04batch/s, loss=2.14e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 198.07batch/s, loss=2.06

70 250


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 197.40batch/s, loss=0.00112] 
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 202.40batch/s, loss=0.000109]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 215.10batch/s, loss=1.7e-5] 
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 208.14batch/s, loss=8.49e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 199.59batch/s, loss=4.78e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 203.92batch/s, loss=2.91e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 205.30batch/s, loss=2.13e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 204.75batch/s, loss=1.85e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 193.07batch/s, loss=1.75e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 190.08batch/s, loss=1.71e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 171.70batch/s, loss=1.68e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 175.32batch/s, loss=1.66e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 169.98batch/s, loss=1.6

70 300


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 168.70batch/s, loss=0.000754]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 171.39batch/s, loss=4.51e-5]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 174.70batch/s, loss=9.31e-6]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 171.57batch/s, loss=4.53e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 198.65batch/s, loss=2.3e-6] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 208.59batch/s, loss=1.48e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 191.97batch/s, loss=1.24e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 211.44batch/s, loss=1.19e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 207.70batch/s, loss=1.18e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 196.99batch/s, loss=1.19e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 194.45batch/s, loss=1.21e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 200.70batch/s, loss=1.22e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 194.36batch/s, loss=1.23

70 350


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 194.52batch/s, loss=0.000514]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 208.45batch/s, loss=2.53e-5]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 201.08batch/s, loss=6.61e-6]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 212.56batch/s, loss=3.24e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 190.77batch/s, loss=2e-6]   
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 208.02batch/s, loss=1.63e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 199.87batch/s, loss=1.53e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 199.92batch/s, loss=1.51e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 189.91batch/s, loss=1.51e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 180.24batch/s, loss=1.51e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 167.64batch/s, loss=1.5e-6] 
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 175.58batch/s, loss=1.47e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 166.38batch/s, loss=1.43

70 400


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 175.85batch/s, loss=0.00047] 
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 178.23batch/s, loss=2.6e-5] 
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 171.67batch/s, loss=6.61e-6]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 177.24batch/s, loss=2.63e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 172.24batch/s, loss=1.42e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 179.66batch/s, loss=1.14e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 171.86batch/s, loss=1.08e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 169.96batch/s, loss=1.1e-6] 
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 170.23batch/s, loss=1.12e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 180.90batch/s, loss=1.13e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 159.49batch/s, loss=1.14e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 167.56batch/s, loss=1.16e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 177.65batch/s, loss=1.18

100 10


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 183.56batch/s, loss=0.00722]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 174.40batch/s, loss=0.00601]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 182.93batch/s, loss=0.00565]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 173.72batch/s, loss=0.0055] 
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 167.65batch/s, loss=0.00539]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 186.35batch/s, loss=0.00528]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 169.16batch/s, loss=0.00517]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 173.96batch/s, loss=0.00507]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 174.58batch/s, loss=0.00498]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 179.21batch/s, loss=0.00492]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 168.10batch/s, loss=0.00487]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 164.83batch/s, loss=0.00483]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 171.70batch/s, loss=0.004

100 20


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 172.63batch/s, loss=0.00592]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 194.16batch/s, loss=0.00514]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 211.54batch/s, loss=0.00464]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 203.67batch/s, loss=0.00435]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 207.89batch/s, loss=0.00421]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 203.00batch/s, loss=0.00413]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 211.49batch/s, loss=0.00408]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 207.95batch/s, loss=0.00405]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 207.13batch/s, loss=0.00402]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 204.50batch/s, loss=0.004]  
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 189.48batch/s, loss=0.00397]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 168.77batch/s, loss=0.00396]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 177.94batch/s, loss=0.003

100 30


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 199.96batch/s, loss=0.00528]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 216.65batch/s, loss=0.00418]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 201.58batch/s, loss=0.00371]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 209.84batch/s, loss=0.00348]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 200.77batch/s, loss=0.00337]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 212.86batch/s, loss=0.00331]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 207.23batch/s, loss=0.00328]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 199.25batch/s, loss=0.00326]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 205.49batch/s, loss=0.00326]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 202.80batch/s, loss=0.00326]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 210.72batch/s, loss=0.00327]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 197.61batch/s, loss=0.00328]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 199.26batch/s, loss=0.003

100 50


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 206.14batch/s, loss=0.00431]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 201.18batch/s, loss=0.00311]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 210.47batch/s, loss=0.00259]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 194.60batch/s, loss=0.00236]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 211.48batch/s, loss=0.00226]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 211.34batch/s, loss=0.00222]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 206.20batch/s, loss=0.0022] 
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 208.06batch/s, loss=0.00218]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 192.62batch/s, loss=0.00216]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 210.04batch/s, loss=0.00214]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 204.37batch/s, loss=0.00212]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 194.04batch/s, loss=0.00211]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 186.78batch/s, loss=0.002

100 70


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 203.40batch/s, loss=0.00384]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 195.32batch/s, loss=0.00251]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 184.90batch/s, loss=0.00186]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 167.57batch/s, loss=0.00152]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 178.77batch/s, loss=0.00135]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 171.63batch/s, loss=0.00127] 
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 180.43batch/s, loss=0.00122] 
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 172.11batch/s, loss=0.00118] 
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 172.46batch/s, loss=0.00115] 
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 175.77batch/s, loss=0.00112] 
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 174.07batch/s, loss=0.0011]  
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 172.90batch/s, loss=0.00108] 
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 173.58batch/s, los

100 100


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 167.62batch/s, loss=0.00325]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 176.56batch/s, loss=0.00185]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 180.13batch/s, loss=0.00109] 
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 168.55batch/s, loss=0.000642]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 178.06batch/s, loss=0.000355]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 178.75batch/s, loss=0.000194]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 176.83batch/s, loss=0.000115]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 180.63batch/s, loss=6.39e-5]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 166.33batch/s, loss=3.25e-5]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 176.36batch/s, loss=1.92e-5]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 175.90batch/s, loss=1.39e-5]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 179.07batch/s, loss=1.12e-5]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 199.20batch/s, loss=

100 150


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 193.83batch/s, loss=0.00252]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 202.85batch/s, loss=0.00106] 
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 198.16batch/s, loss=0.000371]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 205.75batch/s, loss=8.33e-5]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 202.33batch/s, loss=1.39e-5]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 200.24batch/s, loss=6.09e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 191.87batch/s, loss=5.09e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 202.97batch/s, loss=4.49e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 204.54batch/s, loss=4.09e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 187.57batch/s, loss=3.88e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 196.57batch/s, loss=3.76e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 197.47batch/s, loss=3.69e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 202.61batch/s, loss=3.6

100 200


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 200.35batch/s, loss=0.00188]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 191.51batch/s, loss=0.000487]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 190.82batch/s, loss=9.62e-5]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 209.39batch/s, loss=1.32e-5]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 198.18batch/s, loss=4.42e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 198.79batch/s, loss=3.06e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 190.28batch/s, loss=2.52e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 185.22batch/s, loss=2.3e-6] 
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 197.61batch/s, loss=2.2e-6] 
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 192.03batch/s, loss=2.16e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 200.23batch/s, loss=2.13e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 193.14batch/s, loss=2.1e-6] 
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 207.59batch/s, loss=2.07

100 250


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 165.54batch/s, loss=0.00168]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 180.74batch/s, loss=0.000319]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 192.08batch/s, loss=3.74e-5]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 189.02batch/s, loss=6.21e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 204.11batch/s, loss=3.89e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 187.42batch/s, loss=3.29e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 197.14batch/s, loss=3.05e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 193.10batch/s, loss=2.94e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 192.87batch/s, loss=2.85e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 191.70batch/s, loss=2.77e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 163.15batch/s, loss=2.69e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 163.74batch/s, loss=2.59e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 167.78batch/s, loss=2.5e

100 300


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 159.34batch/s, loss=0.00133] 
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 179.54batch/s, loss=0.000169]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 176.26batch/s, loss=1.35e-5]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 162.94batch/s, loss=3.22e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 192.12batch/s, loss=2.06e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 203.24batch/s, loss=1.74e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 194.17batch/s, loss=1.65e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 190.79batch/s, loss=1.63e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 203.35batch/s, loss=1.61e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 205.84batch/s, loss=1.58e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 187.50batch/s, loss=1.55e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 191.52batch/s, loss=1.51e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 201.56batch/s, loss=1.4

100 350


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 187.56batch/s, loss=0.00104] 
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 170.98batch/s, loss=7.98e-5]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 174.97batch/s, loss=5.2e-6] 
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 156.12batch/s, loss=2.04e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 173.26batch/s, loss=1.37e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 171.88batch/s, loss=1.18e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 169.69batch/s, loss=1.14e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 161.13batch/s, loss=1.14e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 172.45batch/s, loss=1.13e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 165.65batch/s, loss=1.12e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 164.63batch/s, loss=1.11e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 166.54batch/s, loss=1.11e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 167.96batch/s, loss=1.11

100 400


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 159.72batch/s, loss=0.000919]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 170.26batch/s, loss=5.03e-5]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 170.35batch/s, loss=3.36e-6]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 152.65batch/s, loss=1.87e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 164.95batch/s, loss=1.56e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 172.79batch/s, loss=1.48e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 165.25batch/s, loss=1.45e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 166.35batch/s, loss=1.41e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 161.57batch/s, loss=1.38e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 168.10batch/s, loss=1.35e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 153.25batch/s, loss=1.32e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 170.48batch/s, loss=1.29e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 163.47batch/s, loss=1.26

150 10


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 163.36batch/s, loss=0.00671]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 166.24batch/s, loss=0.00544]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 172.33batch/s, loss=0.00526]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 170.11batch/s, loss=0.00513]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 169.08batch/s, loss=0.00501]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 164.04batch/s, loss=0.00489]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 172.14batch/s, loss=0.00478]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 171.49batch/s, loss=0.00469]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 171.74batch/s, loss=0.00461]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 163.05batch/s, loss=0.00455]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 168.58batch/s, loss=0.00449]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 165.54batch/s, loss=0.00445]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 163.76batch/s, loss=0.004

150 20


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 174.25batch/s, loss=0.00528]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 165.11batch/s, loss=0.00471]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 174.72batch/s, loss=0.0044] 
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 172.35batch/s, loss=0.0042] 
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 174.25batch/s, loss=0.00407]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 163.81batch/s, loss=0.00398]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 197.56batch/s, loss=0.00392]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 198.33batch/s, loss=0.00388]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 204.60batch/s, loss=0.00385]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 195.00batch/s, loss=0.00383]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 205.55batch/s, loss=0.00381]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 195.36batch/s, loss=0.00378]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 200.33batch/s, loss=0.003

150 30


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 167.26batch/s, loss=0.00482]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 176.36batch/s, loss=0.00395]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 187.00batch/s, loss=0.00363]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 199.84batch/s, loss=0.0035] 
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 198.84batch/s, loss=0.00344]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 198.93batch/s, loss=0.00342]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 208.43batch/s, loss=0.00342]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 186.41batch/s, loss=0.00341]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 205.36batch/s, loss=0.00341]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 194.54batch/s, loss=0.00341]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 196.86batch/s, loss=0.00341]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 193.12batch/s, loss=0.0034] 
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 190.70batch/s, loss=0.003

150 50


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 172.80batch/s, loss=0.00426]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 200.64batch/s, loss=0.00318]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 197.33batch/s, loss=0.00282]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 189.08batch/s, loss=0.00267]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 191.64batch/s, loss=0.0026] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 198.31batch/s, loss=0.00255]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 199.18batch/s, loss=0.00251]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 188.85batch/s, loss=0.00248]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 204.70batch/s, loss=0.00246]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 194.72batch/s, loss=0.00245]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 207.07batch/s, loss=0.00244]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 179.32batch/s, loss=0.00243]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 202.34batch/s, loss=0.002

150 70


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 196.48batch/s, loss=0.00371]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 197.99batch/s, loss=0.00274]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 215.31batch/s, loss=0.00235]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 188.71batch/s, loss=0.00218]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 208.19batch/s, loss=0.00209]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 197.71batch/s, loss=0.00203]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 202.26batch/s, loss=0.00199]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 199.59batch/s, loss=0.00196]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 202.98batch/s, loss=0.00194]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 190.32batch/s, loss=0.00193]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 205.99batch/s, loss=0.00191]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 189.46batch/s, loss=0.0019] 
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 201.79batch/s, loss=0.001

150 100


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 190.93batch/s, loss=0.0033] 
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 196.32batch/s, loss=0.00223]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 189.86batch/s, loss=0.0017] 
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 202.19batch/s, loss=0.00141]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 203.51batch/s, loss=0.00125]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 201.21batch/s, loss=0.00115] 
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 195.20batch/s, loss=0.00107] 
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 185.58batch/s, loss=0.00101] 
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 203.28batch/s, loss=0.000956]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 186.58batch/s, loss=0.000911]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 169.09batch/s, loss=0.000874]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 168.34batch/s, loss=0.000845]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 175.38batch/s, los

150 150


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 159.54batch/s, loss=0.00257]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 168.60batch/s, loss=0.00119]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 166.10batch/s, loss=0.000557]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 192.74batch/s, loss=0.000292]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 195.74batch/s, loss=0.000163]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 207.22batch/s, loss=8.65e-5] 
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 207.01batch/s, loss=4.53e-5]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 192.68batch/s, loss=2.18e-5]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 197.01batch/s, loss=8.93e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 181.11batch/s, loss=5.21e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 204.97batch/s, loss=4.66e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 191.60batch/s, loss=4.46e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 177.26batch/s, loss=4

150 200


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 161.87batch/s, loss=0.00219]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 162.30batch/s, loss=0.000755]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 174.61batch/s, loss=0.000227]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 170.08batch/s, loss=4.99e-5]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 164.79batch/s, loss=9.02e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 160.65batch/s, loss=3.95e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 189.96batch/s, loss=3.34e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 196.67batch/s, loss=3.16e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 197.52batch/s, loss=3.09e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 183.37batch/s, loss=3.03e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 195.38batch/s, loss=2.99e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 192.10batch/s, loss=2.94e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 199.61batch/s, loss=2.8

150 250


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 169.38batch/s, loss=0.00177]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 175.52batch/s, loss=0.000457]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 196.46batch/s, loss=8.4e-5]  
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 184.61batch/s, loss=1.11e-5]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 201.48batch/s, loss=2.54e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 202.02batch/s, loss=1.85e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 185.94batch/s, loss=1.74e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 192.90batch/s, loss=1.74e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 196.20batch/s, loss=1.76e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 179.51batch/s, loss=1.77e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 186.36batch/s, loss=1.78e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 204.66batch/s, loss=1.78e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 193.47batch/s, loss=1.7

150 300


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 162.34batch/s, loss=0.00157]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 166.82batch/s, loss=0.00031] 
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 150.66batch/s, loss=3.43e-5]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 173.93batch/s, loss=3.43e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 169.41batch/s, loss=1.55e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 160.75batch/s, loss=1.41e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 164.78batch/s, loss=1.43e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 157.42batch/s, loss=1.47e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 171.48batch/s, loss=1.51e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 150.36batch/s, loss=1.54e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 174.20batch/s, loss=1.55e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 163.92batch/s, loss=1.55e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 153.42batch/s, loss=1.56

150 350


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 146.72batch/s, loss=0.00137] 
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 125.58batch/s, loss=0.000183]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 145.30batch/s, loss=1.22e-5]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 134.58batch/s, loss=1.98e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 142.44batch/s, loss=1.49e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 136.64batch/s, loss=1.46e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 133.73batch/s, loss=1.47e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 138.96batch/s, loss=1.48e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 134.99batch/s, loss=1.48e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 136.14batch/s, loss=1.48e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 143.14batch/s, loss=1.48e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 140.33batch/s, loss=1.47e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 133.10batch/s, loss=1.4

150 400


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 129.05batch/s, loss=0.00119] 
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 133.87batch/s, loss=0.000114]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 125.01batch/s, loss=8.3e-6] 
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 112.43batch/s, loss=1.47e-6]
Epoch 4: 100%|██████████| 109/109 [00:01<00:00, 75.51batch/s, loss=1.25e-6]
Epoch 5: 100%|██████████| 109/109 [00:01<00:00, 91.18batch/s, loss=1.29e-6] 
Epoch 6: 100%|██████████| 109/109 [00:01<00:00, 88.35batch/s, loss=1.33e-6] 
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 149.14batch/s, loss=1.36e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 156.59batch/s, loss=1.37e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 158.11batch/s, loss=1.37e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 165.25batch/s, loss=1.36e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 156.53batch/s, loss=1.34e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 159.06batch/s, loss=1.32

200 10


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 169.25batch/s, loss=0.00588]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 165.05batch/s, loss=0.00482]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 167.95batch/s, loss=0.00457]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 174.97batch/s, loss=0.00444]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 175.97batch/s, loss=0.00436]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 164.89batch/s, loss=0.00429]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 180.36batch/s, loss=0.00421]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 165.58batch/s, loss=0.00414]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 163.19batch/s, loss=0.00408]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 166.12batch/s, loss=0.00402]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 179.26batch/s, loss=0.00397]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 173.22batch/s, loss=0.00392]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 170.20batch/s, loss=0.003

200 20


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 167.22batch/s, loss=0.00475]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 180.11batch/s, loss=0.00424]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 176.69batch/s, loss=0.00393]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 162.27batch/s, loss=0.00367]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 173.18batch/s, loss=0.00351]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 171.88batch/s, loss=0.00342]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 168.93batch/s, loss=0.00337]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 165.18batch/s, loss=0.00333]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 169.50batch/s, loss=0.00331]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 164.45batch/s, loss=0.00329]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 184.76batch/s, loss=0.00328]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 197.03batch/s, loss=0.00327]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 199.28batch/s, loss=0.003

200 30


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 201.73batch/s, loss=0.00452]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 207.75batch/s, loss=0.00359]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 201.12batch/s, loss=0.00326]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 203.05batch/s, loss=0.00313]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 193.04batch/s, loss=0.00306]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 207.63batch/s, loss=0.00302]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 199.61batch/s, loss=0.00299]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 191.19batch/s, loss=0.00297]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 194.18batch/s, loss=0.00296]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 200.25batch/s, loss=0.00295]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 204.19batch/s, loss=0.00295]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 189.59batch/s, loss=0.00295]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 200.75batch/s, loss=0.002

200 50


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 197.18batch/s, loss=0.00371]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 197.23batch/s, loss=0.00297]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 197.62batch/s, loss=0.0027] 
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 183.60batch/s, loss=0.00258]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 197.18batch/s, loss=0.00252]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 205.77batch/s, loss=0.00248]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 194.65batch/s, loss=0.00246]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 189.65batch/s, loss=0.00244]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 198.24batch/s, loss=0.00242]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 193.71batch/s, loss=0.00241]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 201.76batch/s, loss=0.00241]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 194.34batch/s, loss=0.0024] 
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 204.17batch/s, loss=0.002

200 70


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 198.91batch/s, loss=0.00332]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 190.22batch/s, loss=0.00249]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 194.71batch/s, loss=0.00215]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 198.70batch/s, loss=0.002]  
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 197.55batch/s, loss=0.00193]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 189.22batch/s, loss=0.00188]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 192.73batch/s, loss=0.00185]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 182.97batch/s, loss=0.00182]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 197.52batch/s, loss=0.0018] 
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 190.27batch/s, loss=0.00179]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 204.45batch/s, loss=0.00178]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 190.55batch/s, loss=0.00177]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 195.81batch/s, loss=0.001

200 100


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 163.18batch/s, loss=0.00289]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 167.63batch/s, loss=0.00208]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 168.02batch/s, loss=0.00167]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 175.63batch/s, loss=0.00143]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 165.02batch/s, loss=0.00129]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 167.29batch/s, loss=0.00121]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 164.44batch/s, loss=0.00115]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 171.58batch/s, loss=0.00111]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 171.32batch/s, loss=0.00107]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 165.42batch/s, loss=0.00105]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 172.23batch/s, loss=0.00103]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 170.85batch/s, loss=0.00101]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 162.69batch/s, loss=0.000

200 150


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 176.46batch/s, loss=0.00245]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 162.58batch/s, loss=0.00138]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 168.91batch/s, loss=0.000916]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 159.22batch/s, loss=0.000693]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 167.01batch/s, loss=0.000576]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 173.67batch/s, loss=0.000519]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 165.77batch/s, loss=0.000485]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 156.42batch/s, loss=0.00046] 
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 149.29batch/s, loss=0.000441]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 170.86batch/s, loss=0.000426]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 166.94batch/s, loss=0.000415]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 157.17batch/s, loss=0.000408]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 154.32batch/s, 

200 200


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 190.77batch/s, loss=0.00213]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 177.01batch/s, loss=0.000966]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 187.05batch/s, loss=0.000445]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 187.14batch/s, loss=0.000219]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 181.07batch/s, loss=0.000111]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 187.75batch/s, loss=5.2e-5]  
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 198.36batch/s, loss=2.72e-5]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 180.59batch/s, loss=1.6e-5] 
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 190.25batch/s, loss=9.72e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 170.31batch/s, loss=6.01e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 186.93batch/s, loss=4.47e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 183.36batch/s, loss=4.18e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 192.72batch/s, loss=

200 250


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 185.45batch/s, loss=0.00181]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 180.14batch/s, loss=0.000663]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 176.90batch/s, loss=0.000204]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 185.34batch/s, loss=5.38e-5] 
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 175.67batch/s, loss=1.1e-5] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 169.03batch/s, loss=2.83e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 165.13batch/s, loss=1.92e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 143.17batch/s, loss=1.85e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 131.38batch/s, loss=1.86e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 147.49batch/s, loss=1.9e-6] 
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 152.71batch/s, loss=1.94e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 148.81batch/s, loss=1.97e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 163.23batch/s, loss=1.

200 300


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 175.25batch/s, loss=0.00154]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 181.38batch/s, loss=0.00044] 
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 172.18batch/s, loss=0.000114]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 169.93batch/s, loss=2.18e-5]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 165.15batch/s, loss=3.5e-6] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 116.21batch/s, loss=1.84e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 124.59batch/s, loss=1.67e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 153.25batch/s, loss=1.63e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 166.16batch/s, loss=1.65e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 167.68batch/s, loss=1.67e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 161.27batch/s, loss=1.68e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 188.89batch/s, loss=1.7e-6] 
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 157.67batch/s, loss=1.7

200 350


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 153.64batch/s, loss=0.00127]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 155.06batch/s, loss=0.000265]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 154.69batch/s, loss=4.23e-5]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 149.77batch/s, loss=6.1e-6] 
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 159.47batch/s, loss=2.05e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 168.86batch/s, loss=1.64e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 157.08batch/s, loss=1.61e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 158.51batch/s, loss=1.63e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 155.68batch/s, loss=1.65e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 156.90batch/s, loss=1.66e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 159.08batch/s, loss=1.66e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 141.90batch/s, loss=1.66e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 135.26batch/s, loss=1.67

200 400


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 163.56batch/s, loss=0.00117] 
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 154.06batch/s, loss=0.000195]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 170.52batch/s, loss=1.95e-5]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 162.69batch/s, loss=2.59e-6]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 145.24batch/s, loss=1.35e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 133.77batch/s, loss=1.19e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 138.14batch/s, loss=1.18e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 135.19batch/s, loss=1.19e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 139.18batch/s, loss=1.21e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 142.74batch/s, loss=1.22e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 144.74batch/s, loss=1.23e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 136.12batch/s, loss=1.24e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 128.47batch/s, loss=1.2

250 10


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 183.49batch/s, loss=0.00533]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 177.27batch/s, loss=0.00449]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 170.93batch/s, loss=0.00439]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 171.56batch/s, loss=0.00429]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 141.33batch/s, loss=0.00416]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 143.27batch/s, loss=0.00404]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 140.20batch/s, loss=0.00392]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 139.99batch/s, loss=0.00383]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 141.04batch/s, loss=0.00374]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 134.49batch/s, loss=0.00367]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 149.68batch/s, loss=0.00362]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 156.91batch/s, loss=0.00358]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 163.18batch/s, loss=0.003

250 20


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 163.75batch/s, loss=0.00441]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 174.80batch/s, loss=0.00387]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 167.65batch/s, loss=0.00353]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 165.62batch/s, loss=0.00335]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 162.82batch/s, loss=0.00325]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 169.60batch/s, loss=0.00318]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 165.57batch/s, loss=0.00313]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 178.96batch/s, loss=0.00308]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 185.01batch/s, loss=0.00305]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 185.57batch/s, loss=0.00301]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 164.86batch/s, loss=0.00298]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 167.11batch/s, loss=0.00296]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 163.25batch/s, loss=0.002

250 30


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 193.15batch/s, loss=0.0039] 
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 208.55batch/s, loss=0.0033] 
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 194.36batch/s, loss=0.00306]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 185.80batch/s, loss=0.00296]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 207.58batch/s, loss=0.0029] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 191.38batch/s, loss=0.00286]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 190.75batch/s, loss=0.00283]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 171.20batch/s, loss=0.0028] 
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 189.75batch/s, loss=0.00277]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 176.28batch/s, loss=0.00275]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 179.84batch/s, loss=0.00274]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 179.42batch/s, loss=0.00273]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 187.65batch/s, loss=0.002

250 50


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 207.80batch/s, loss=0.0033] 
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 231.39batch/s, loss=0.00276]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 205.48batch/s, loss=0.00256]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 206.06batch/s, loss=0.00246]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 201.08batch/s, loss=0.0024] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 205.04batch/s, loss=0.00234]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 200.68batch/s, loss=0.0023] 
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 198.98batch/s, loss=0.00226]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 207.68batch/s, loss=0.00223]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 203.78batch/s, loss=0.00221]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 210.98batch/s, loss=0.0022] 
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 188.14batch/s, loss=0.00219]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 192.70batch/s, loss=0.002

250 70


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 198.80batch/s, loss=0.00312]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 217.74batch/s, loss=0.00249]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 223.64batch/s, loss=0.00221]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 206.52batch/s, loss=0.00206]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 207.46batch/s, loss=0.00196]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 193.69batch/s, loss=0.00189]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 193.04batch/s, loss=0.00185]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 187.60batch/s, loss=0.00181]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 186.97batch/s, loss=0.00178]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 178.63batch/s, loss=0.00176]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 194.79batch/s, loss=0.00174]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 178.02batch/s, loss=0.00173]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 181.55batch/s, loss=0.001

250 100


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 164.36batch/s, loss=0.00281]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 162.68batch/s, loss=0.00196]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 175.35batch/s, loss=0.0016] 
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 184.59batch/s, loss=0.00143]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 190.80batch/s, loss=0.00133]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 179.41batch/s, loss=0.00125]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 189.18batch/s, loss=0.00119]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 189.23batch/s, loss=0.00114]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 192.00batch/s, loss=0.0011] 
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 211.51batch/s, loss=0.00106]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 216.66batch/s, loss=0.00104]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 199.90batch/s, loss=0.00102]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 187.85batch/s, loss=0.001

250 150


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 167.89batch/s, loss=0.00225]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 162.76batch/s, loss=0.00139]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 166.61batch/s, loss=0.00097]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 169.09batch/s, loss=0.000763]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 164.36batch/s, loss=0.000663]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 168.07batch/s, loss=0.000603]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 164.81batch/s, loss=0.000558]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 161.88batch/s, loss=0.000522]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 165.73batch/s, loss=0.000492]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 161.60batch/s, loss=0.000467]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 149.22batch/s, loss=0.000447]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 148.36batch/s, loss=0.000431]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 163.43batch/s, l

250 200


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 153.16batch/s, loss=0.00203]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 176.15batch/s, loss=0.00105]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 163.82batch/s, loss=0.000599]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 152.28batch/s, loss=0.000367]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 164.64batch/s, loss=0.000262]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 154.34batch/s, loss=0.000219]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 161.50batch/s, loss=0.000199]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 144.09batch/s, loss=0.000187]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 169.83batch/s, loss=0.000179]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 180.43batch/s, loss=0.000173]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 164.42batch/s, loss=0.000169]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 163.95batch/s, loss=0.000166]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 162.86batch/s, 

250 250


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 158.85batch/s, loss=0.00175]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 158.40batch/s, loss=0.000724]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 160.29batch/s, loss=0.000313]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 155.01batch/s, loss=0.000145]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 158.34batch/s, loss=7.68e-5] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 162.48batch/s, loss=4.54e-5] 
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 151.89batch/s, loss=2.64e-5]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 164.98batch/s, loss=1.58e-5]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 170.36batch/s, loss=1.05e-5]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 159.76batch/s, loss=7.98e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 160.20batch/s, loss=6.28e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 172.37batch/s, loss=4.84e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 157.29batch/s, loss=

250 300


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 170.87batch/s, loss=0.00155]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 177.43batch/s, loss=0.000515]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 153.61batch/s, loss=0.000176]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 150.63batch/s, loss=6.41e-5] 
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 168.62batch/s, loss=2.26e-5]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 158.40batch/s, loss=7.18e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 171.95batch/s, loss=2.92e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 166.76batch/s, loss=2.1e-6] 
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 164.43batch/s, loss=2.02e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 169.45batch/s, loss=2.04e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 146.69batch/s, loss=2.07e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 168.85batch/s, loss=2.08e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 169.25batch/s, loss=2.

250 350


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 156.24batch/s, loss=0.00145]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 160.02batch/s, loss=0.000407]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 158.12batch/s, loss=9.8e-5]  
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 145.53batch/s, loss=2.64e-5]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 148.30batch/s, loss=7.61e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 135.73batch/s, loss=2.49e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 127.77batch/s, loss=1.44e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 122.36batch/s, loss=1.34e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 118.83batch/s, loss=1.38e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 129.16batch/s, loss=1.42e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 147.14batch/s, loss=1.47e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 142.64batch/s, loss=1.5e-6] 
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 129.13batch/s, loss=1.5

250 400


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 118.60batch/s, loss=0.00121]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 129.08batch/s, loss=0.000268]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 128.34batch/s, loss=6.89e-5] 
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 113.75batch/s, loss=1.6e-5] 
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 116.52batch/s, loss=3.25e-6]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 128.30batch/s, loss=1.33e-6]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 125.24batch/s, loss=1.2e-6] 
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 161.24batch/s, loss=1.22e-6]
Epoch 8: 100%|██████████| 109/109 [00:01<00:00, 100.47batch/s, loss=1.24e-6]
Epoch 9: 100%|██████████| 109/109 [00:01<00:00, 104.17batch/s, loss=1.27e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 118.95batch/s, loss=1.29e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 137.97batch/s, loss=1.33e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 132.55batch/s, loss=1.3

300 10


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 136.66batch/s, loss=0.00511]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 125.20batch/s, loss=0.0041] 
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 145.43batch/s, loss=0.004]  
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 139.64batch/s, loss=0.00392]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 129.84batch/s, loss=0.00386]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 138.97batch/s, loss=0.0038] 
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 126.34batch/s, loss=0.00374]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 134.13batch/s, loss=0.00368]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 132.41batch/s, loss=0.00363]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 129.98batch/s, loss=0.00357]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 137.21batch/s, loss=0.00351]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 140.71batch/s, loss=0.00345]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 135.50batch/s, loss=0.003

300 20


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 133.04batch/s, loss=0.00411]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 150.02batch/s, loss=0.00366]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 174.34batch/s, loss=0.00343]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 165.91batch/s, loss=0.00326]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 147.24batch/s, loss=0.00313]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 161.71batch/s, loss=0.00305]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 160.53batch/s, loss=0.00299]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 154.94batch/s, loss=0.00296]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 162.61batch/s, loss=0.00294]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 154.41batch/s, loss=0.00292]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 159.97batch/s, loss=0.0029] 
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 167.04batch/s, loss=0.00289]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 158.79batch/s, loss=0.002

300 30


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 191.87batch/s, loss=0.00373]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 188.92batch/s, loss=0.00316]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 183.68batch/s, loss=0.00286]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 179.18batch/s, loss=0.00272]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 191.93batch/s, loss=0.00263]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 188.31batch/s, loss=0.00258]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 197.06batch/s, loss=0.00255]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 177.23batch/s, loss=0.00253]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 173.96batch/s, loss=0.00252]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 169.72batch/s, loss=0.00252]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 188.45batch/s, loss=0.00251]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 185.62batch/s, loss=0.00251]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 172.68batch/s, loss=0.002

300 50


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 179.32batch/s, loss=0.00322]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 181.79batch/s, loss=0.00264]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 174.84batch/s, loss=0.00242]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 210.28batch/s, loss=0.00229]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 202.30batch/s, loss=0.0022] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 199.80batch/s, loss=0.00214]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 204.37batch/s, loss=0.00209]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 186.22batch/s, loss=0.00206]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 162.97batch/s, loss=0.00204]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 158.52batch/s, loss=0.00203]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 171.42batch/s, loss=0.00202]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 156.10batch/s, loss=0.00202]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 172.20batch/s, loss=0.002

300 70


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 142.78batch/s, loss=0.00284]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 158.00batch/s, loss=0.00224]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 175.93batch/s, loss=0.002]  
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 156.43batch/s, loss=0.00187]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 153.97batch/s, loss=0.00178]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 170.02batch/s, loss=0.0017] 
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 152.63batch/s, loss=0.00164]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 176.24batch/s, loss=0.00159]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 214.96batch/s, loss=0.00154]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 198.98batch/s, loss=0.0015] 
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 192.34batch/s, loss=0.00147]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 188.95batch/s, loss=0.00144]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 176.05batch/s, loss=0.001

300 100


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 172.06batch/s, loss=0.00251]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 181.68batch/s, loss=0.00182]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 160.57batch/s, loss=0.00151]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 207.66batch/s, loss=0.00136]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 212.84batch/s, loss=0.00126]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 181.06batch/s, loss=0.00119]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 193.22batch/s, loss=0.00114]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 191.61batch/s, loss=0.0011] 
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 171.87batch/s, loss=0.00107]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 184.65batch/s, loss=0.00104]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 188.57batch/s, loss=0.00102]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 160.32batch/s, loss=0.00101]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 143.32batch/s, loss=0.000

300 150


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 154.91batch/s, loss=0.00223]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 159.67batch/s, loss=0.00142]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 164.77batch/s, loss=0.000999]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 155.34batch/s, loss=0.000773]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 151.43batch/s, loss=0.000656]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 164.42batch/s, loss=0.000587]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 173.61batch/s, loss=0.000543]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 153.64batch/s, loss=0.000514]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 161.41batch/s, loss=0.000494]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 168.33batch/s, loss=0.00048] 
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 152.12batch/s, loss=0.000469]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 159.68batch/s, loss=0.00046] 
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 154.83batch/s, 

300 200


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 141.70batch/s, loss=0.00188]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 153.25batch/s, loss=0.000997]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 158.78batch/s, loss=0.000599]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 155.49batch/s, loss=0.000411]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 156.83batch/s, loss=0.000318]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 170.68batch/s, loss=0.000271]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 156.68batch/s, loss=0.000245]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 144.25batch/s, loss=0.000227]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 167.03batch/s, loss=0.000215]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 162.33batch/s, loss=0.000205]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 162.44batch/s, loss=0.000198]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 170.80batch/s, loss=0.000192]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 163.75batch/s,

300 250


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 155.21batch/s, loss=0.00162]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 161.12batch/s, loss=0.000726]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 164.65batch/s, loss=0.000358]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 176.13batch/s, loss=0.000216]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 163.08batch/s, loss=0.00015] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 142.52batch/s, loss=0.000114]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 154.90batch/s, loss=9.38e-5] 
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 147.30batch/s, loss=8.23e-5] 
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 153.53batch/s, loss=7.56e-5] 
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 176.29batch/s, loss=7.16e-5] 
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 139.67batch/s, loss=6.87e-5] 
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 148.54batch/s, loss=6.66e-5] 
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 163.94batch/s,

300 300


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 159.76batch/s, loss=0.00147]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 147.07batch/s, loss=0.000566]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 165.25batch/s, loss=0.000232]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 183.64batch/s, loss=0.000109]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 163.33batch/s, loss=6.07e-5] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 155.26batch/s, loss=3.84e-5] 
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 145.39batch/s, loss=2.57e-5] 
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 121.58batch/s, loss=1.78e-5]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 136.60batch/s, loss=1.28e-5]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 133.15batch/s, loss=9.24e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 117.69batch/s, loss=6.75e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 126.04batch/s, loss=5.31e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 131.45batch/s, loss

300 350


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 119.28batch/s, loss=0.0013] 
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 132.07batch/s, loss=0.00044] 
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 127.62batch/s, loss=0.000165]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 128.76batch/s, loss=7.08e-5] 
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 145.50batch/s, loss=3.49e-5] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 125.62batch/s, loss=1.91e-5]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 125.15batch/s, loss=1.11e-5]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 147.93batch/s, loss=6.29e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 121.85batch/s, loss=3.5e-6] 
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 131.62batch/s, loss=2.22e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 122.96batch/s, loss=1.77e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 125.77batch/s, loss=1.66e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 130.21batch/s, loss=1

300 400


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 123.04batch/s, loss=0.00117]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 130.24batch/s, loss=0.000333]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 118.72batch/s, loss=0.000106]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 127.26batch/s, loss=4.3e-5]  
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 121.12batch/s, loss=2e-5]   
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 125.86batch/s, loss=1.01e-5]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 124.71batch/s, loss=5.16e-6]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 120.98batch/s, loss=2.73e-6]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 126.87batch/s, loss=1.73e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 119.44batch/s, loss=1.4e-6] 
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 125.43batch/s, loss=1.36e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 122.08batch/s, loss=1.4e-6] 
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 126.38batch/s, loss=1.

350 10


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 148.22batch/s, loss=0.00488]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 136.37batch/s, loss=0.00395]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 124.93batch/s, loss=0.00387]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 149.08batch/s, loss=0.0038] 
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 128.37batch/s, loss=0.00374]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 150.33batch/s, loss=0.00367]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 125.64batch/s, loss=0.0036] 
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 139.45batch/s, loss=0.00353]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 141.98batch/s, loss=0.00345]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 129.58batch/s, loss=0.00338]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 136.70batch/s, loss=0.00331]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 136.72batch/s, loss=0.00324]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 144.70batch/s, loss=0.003

350 20


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 130.37batch/s, loss=0.00384]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 135.86batch/s, loss=0.00337]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 136.17batch/s, loss=0.00314]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 119.46batch/s, loss=0.00295]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 136.92batch/s, loss=0.00283]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 140.45batch/s, loss=0.00275]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 163.06batch/s, loss=0.0027] 
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 159.28batch/s, loss=0.00265]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 157.90batch/s, loss=0.00262]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 170.27batch/s, loss=0.00259]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 153.50batch/s, loss=0.00257]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 164.47batch/s, loss=0.00255]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 160.61batch/s, loss=0.002

350 30


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 165.13batch/s, loss=0.00355]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 154.62batch/s, loss=0.00303]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 163.96batch/s, loss=0.00274]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 176.71batch/s, loss=0.0026] 
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 169.39batch/s, loss=0.00251]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 155.62batch/s, loss=0.00245]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 167.60batch/s, loss=0.00241]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 177.26batch/s, loss=0.00237]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 166.48batch/s, loss=0.00234]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 172.26batch/s, loss=0.00232]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 159.97batch/s, loss=0.0023] 
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 164.71batch/s, loss=0.00229]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 158.41batch/s, loss=0.002

350 50


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 184.76batch/s, loss=0.00294]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 177.26batch/s, loss=0.00236]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 203.76batch/s, loss=0.00215]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 185.62batch/s, loss=0.00202]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 183.18batch/s, loss=0.00193]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 177.30batch/s, loss=0.00187]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 186.82batch/s, loss=0.00183]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 167.02batch/s, loss=0.0018] 
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 185.82batch/s, loss=0.00178]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 184.53batch/s, loss=0.00177]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 182.90batch/s, loss=0.00176]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 183.48batch/s, loss=0.00175]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 197.38batch/s, loss=0.001

350 70


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 180.42batch/s, loss=0.00266]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 190.61batch/s, loss=0.0021] 
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 215.90batch/s, loss=0.00188]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 204.40batch/s, loss=0.00176]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 162.55batch/s, loss=0.00166]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 174.04batch/s, loss=0.00159]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 159.84batch/s, loss=0.00153]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 149.96batch/s, loss=0.00148]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 164.73batch/s, loss=0.00145]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 163.98batch/s, loss=0.00143]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 156.34batch/s, loss=0.00141]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 165.51batch/s, loss=0.00139]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 164.17batch/s, loss=0.001

350 100


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 158.73batch/s, loss=0.00233]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 149.69batch/s, loss=0.00176]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 151.11batch/s, loss=0.00146]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 159.89batch/s, loss=0.00129]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 156.73batch/s, loss=0.00117]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 151.84batch/s, loss=0.00109]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 158.58batch/s, loss=0.00104]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 150.15batch/s, loss=0.000994]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 174.55batch/s, loss=0.000962]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 165.11batch/s, loss=0.000938]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 160.95batch/s, loss=0.00092]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 182.30batch/s, loss=0.000905]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 178.28batch/s, loss=0

350 150


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 163.69batch/s, loss=0.00192]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 157.58batch/s, loss=0.00117]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 176.50batch/s, loss=0.000838]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 166.07batch/s, loss=0.000663]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 154.09batch/s, loss=0.000571]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 157.12batch/s, loss=0.000518]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 157.72batch/s, loss=0.000485]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 156.98batch/s, loss=0.000462]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 162.20batch/s, loss=0.000445]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 160.98batch/s, loss=0.000432]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 147.81batch/s, loss=0.000421]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 153.80batch/s, loss=0.000413]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 138.36batch/s, 

350 200


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 135.64batch/s, loss=0.00169]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 151.60batch/s, loss=0.000904]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 142.24batch/s, loss=0.000552]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 150.06batch/s, loss=0.000385]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 173.70batch/s, loss=0.000307]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 149.91batch/s, loss=0.000268]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 153.01batch/s, loss=0.000248]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 152.68batch/s, loss=0.000237]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 146.19batch/s, loss=0.00023] 
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 150.18batch/s, loss=0.000225]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 148.19batch/s, loss=0.000221]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 153.54batch/s, loss=0.000219]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 155.70batch/s,

350 250


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 120.99batch/s, loss=0.00148]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 122.10batch/s, loss=0.000722]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 127.65batch/s, loss=0.000379]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 123.51batch/s, loss=0.000238]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 125.14batch/s, loss=0.00017] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 132.50batch/s, loss=0.000133]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 134.63batch/s, loss=0.000113]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 131.04batch/s, loss=0.000102]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 112.92batch/s, loss=9.6e-5]  
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 120.95batch/s, loss=9.19e-5] 
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 119.50batch/s, loss=8.89e-5] 
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 125.59batch/s, loss=8.67e-5] 
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 128.05batch/s,

350 300


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 143.98batch/s, loss=0.00126]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 129.88batch/s, loss=0.000516]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 122.37batch/s, loss=0.000245]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 131.83batch/s, loss=0.000142]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 120.87batch/s, loss=9.51e-5] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 124.03batch/s, loss=7.06e-5] 
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 126.29batch/s, loss=5.63e-5] 
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 122.33batch/s, loss=4.71e-5] 
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 127.90batch/s, loss=4.11e-5] 
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 127.10batch/s, loss=3.7e-5]  
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 118.65batch/s, loss=3.45e-5] 
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 132.63batch/s, loss=3.31e-5] 
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 133.34batch/s,

350 350


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 134.87batch/s, loss=0.00116]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 124.96batch/s, loss=0.000417]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 121.33batch/s, loss=0.000182]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 122.04batch/s, loss=9.12e-5] 
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 125.45batch/s, loss=5.51e-5] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 133.85batch/s, loss=3.86e-5] 
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 120.56batch/s, loss=2.87e-5] 
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 123.73batch/s, loss=2.18e-5]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 131.88batch/s, loss=1.67e-5]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 126.55batch/s, loss=1.25e-5]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 125.66batch/s, loss=9.45e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 113.05batch/s, loss=7.51e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 127.30batch/s, loss

350 400


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 122.89batch/s, loss=0.00106]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 127.54batch/s, loss=0.000327]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 125.71batch/s, loss=0.00014] 
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 122.29batch/s, loss=7.24e-5] 
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 122.57batch/s, loss=4.18e-5] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 112.55batch/s, loss=2.66e-5]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 133.98batch/s, loss=1.79e-5]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 121.08batch/s, loss=1.23e-5]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 118.56batch/s, loss=8.49e-6]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 125.65batch/s, loss=5.88e-6]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 129.86batch/s, loss=4.27e-6]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 126.25batch/s, loss=3.29e-6]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 125.42batch/s, loss=2

400 10


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 137.24batch/s, loss=0.00465]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 115.78batch/s, loss=0.00371]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 130.40batch/s, loss=0.00364]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 133.98batch/s, loss=0.00357]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 140.72batch/s, loss=0.00348]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 135.92batch/s, loss=0.00339]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 120.44batch/s, loss=0.00332]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 137.08batch/s, loss=0.00325]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 131.15batch/s, loss=0.00319]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 132.79batch/s, loss=0.00314]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 127.64batch/s, loss=0.00308]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 131.13batch/s, loss=0.00303]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 132.83batch/s, loss=0.002

400 20


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 132.39batch/s, loss=0.00367]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 130.98batch/s, loss=0.00328]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 137.55batch/s, loss=0.00304]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 131.42batch/s, loss=0.00287]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 158.97batch/s, loss=0.00275]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 147.36batch/s, loss=0.00266]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 138.64batch/s, loss=0.00259]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 164.57batch/s, loss=0.00253]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 160.83batch/s, loss=0.00248]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 150.18batch/s, loss=0.00245]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 165.50batch/s, loss=0.00242]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 150.88batch/s, loss=0.00239]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 159.12batch/s, loss=0.002

400 30


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 165.84batch/s, loss=0.00344]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 189.53batch/s, loss=0.0029] 
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 215.47batch/s, loss=0.00259]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 180.99batch/s, loss=0.00245]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 186.92batch/s, loss=0.00237]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 173.59batch/s, loss=0.00231]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 162.55batch/s, loss=0.00226]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 163.20batch/s, loss=0.00222]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 165.02batch/s, loss=0.0022] 
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 162.80batch/s, loss=0.00218]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 169.10batch/s, loss=0.00216]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 166.02batch/s, loss=0.00215]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 146.17batch/s, loss=0.002

400 50


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 189.41batch/s, loss=0.00285]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 204.48batch/s, loss=0.00228]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 187.37batch/s, loss=0.00206]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 209.81batch/s, loss=0.00193]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 215.32batch/s, loss=0.00184]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 189.27batch/s, loss=0.00179]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 185.28batch/s, loss=0.00174]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 190.29batch/s, loss=0.00171]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 198.46batch/s, loss=0.0017] 
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 182.59batch/s, loss=0.00168]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 185.83batch/s, loss=0.00167]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 186.81batch/s, loss=0.00167]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 183.01batch/s, loss=0.001

400 70


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 190.43batch/s, loss=0.00247]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 197.34batch/s, loss=0.00198]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 175.82batch/s, loss=0.00178]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 168.83batch/s, loss=0.00165]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 158.50batch/s, loss=0.00156]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 161.38batch/s, loss=0.00149]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 163.24batch/s, loss=0.00144]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 185.68batch/s, loss=0.0014] 
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 138.86batch/s, loss=0.00137]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 148.95batch/s, loss=0.00135]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 150.14batch/s, loss=0.00133]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 146.22batch/s, loss=0.00132]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 156.33batch/s, loss=0.001

400 100


Epoch 0: 100%|██████████| 109/109 [00:01<00:00, 106.57batch/s, loss=0.00212]
Epoch 1: 100%|██████████| 109/109 [00:01<00:00, 100.32batch/s, loss=0.00156]
Epoch 2: 100%|██████████| 109/109 [00:01<00:00, 98.98batch/s, loss=0.0013]  
Epoch 3: 100%|██████████| 109/109 [00:01<00:00, 105.63batch/s, loss=0.00116]
Epoch 4: 100%|██████████| 109/109 [00:01<00:00, 108.00batch/s, loss=0.00107]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 128.83batch/s, loss=0.00101]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 137.30batch/s, loss=0.000975]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 153.92batch/s, loss=0.000947]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 137.52batch/s, loss=0.000925]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 143.38batch/s, loss=0.000907]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 137.79batch/s, loss=0.000892]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 146.41batch/s, loss=0.000879]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 151.51batch/s, loss

400 150


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 163.06batch/s, loss=0.00184]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 154.39batch/s, loss=0.00119]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 158.03batch/s, loss=0.000874]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 153.90batch/s, loss=0.000696]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 136.13batch/s, loss=0.000589]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 134.43batch/s, loss=0.000525]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 122.08batch/s, loss=0.000483]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 123.80batch/s, loss=0.000454]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 125.98batch/s, loss=0.000434]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 132.54batch/s, loss=0.000419]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 150.57batch/s, loss=0.000408]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 144.76batch/s, loss=0.0004]  
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 157.65batch/s, 

400 200


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 142.60batch/s, loss=0.00161]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 145.36batch/s, loss=0.000911]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 141.53batch/s, loss=0.000577]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 149.46batch/s, loss=0.000401]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 153.04batch/s, loss=0.000301]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 144.04batch/s, loss=0.000249]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 147.21batch/s, loss=0.000222]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 145.89batch/s, loss=0.000209]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 149.71batch/s, loss=0.000201]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 167.44batch/s, loss=0.000197]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 143.15batch/s, loss=0.000194]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 153.07batch/s, loss=0.000192]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 150.85batch/s,

400 250


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 158.10batch/s, loss=0.00147]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 144.88batch/s, loss=0.000685]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 151.58batch/s, loss=0.000366]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 130.04batch/s, loss=0.00023] 
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 111.87batch/s, loss=0.000162]
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 113.34batch/s, loss=0.000129]
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 115.57batch/s, loss=0.000112]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 135.74batch/s, loss=0.000103]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 125.15batch/s, loss=9.78e-5] 
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 129.29batch/s, loss=9.49e-5] 
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 117.91batch/s, loss=9.3e-5]  
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 125.65batch/s, loss=9.21e-5] 
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 140.10batch/s,

400 300


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 157.63batch/s, loss=0.00128]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 123.32batch/s, loss=0.000541]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 126.56batch/s, loss=0.000255]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 127.96batch/s, loss=0.000143]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 120.82batch/s, loss=9.73e-5] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 134.07batch/s, loss=7.53e-5] 
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 120.60batch/s, loss=6.33e-5] 
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 126.04batch/s, loss=5.58e-5] 
Epoch 8: 100%|██████████| 109/109 [00:01<00:00, 108.12batch/s, loss=5.08e-5]
Epoch 9: 100%|██████████| 109/109 [00:01<00:00, 97.90batch/s, loss=4.73e-5] 
Epoch 10: 100%|██████████| 109/109 [00:01<00:00, 99.22batch/s, loss=4.49e-5]  
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 127.02batch/s, loss=4.4e-5]  
Epoch 12: 100%|██████████| 109/109 [00:01<00:00, 107.81batch/s, l

400 350


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 145.25batch/s, loss=0.00112]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 155.56batch/s, loss=0.000381]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 170.18batch/s, loss=0.000168]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 161.59batch/s, loss=9.73e-5] 
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 173.47batch/s, loss=6.58e-5] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 165.63batch/s, loss=4.74e-5] 
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 158.15batch/s, loss=3.51e-5] 
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 131.12batch/s, loss=2.75e-5] 
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 132.60batch/s, loss=2.29e-5]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 137.94batch/s, loss=1.97e-5]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 126.19batch/s, loss=1.78e-5]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 130.22batch/s, loss=1.61e-5]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 130.12batch/s, los

400 400


Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 129.45batch/s, loss=0.00101]
Epoch 1: 100%|██████████| 109/109 [00:01<00:00, 106.02batch/s, loss=0.000339]
Epoch 2: 100%|██████████| 109/109 [00:01<00:00, 88.77batch/s, loss=0.000143]
Epoch 3: 100%|██████████| 109/109 [00:01<00:00, 72.66batch/s, loss=7.67e-5] 
Epoch 4: 100%|██████████| 109/109 [00:01<00:00, 77.51batch/s, loss=4.85e-5] 
Epoch 5: 100%|██████████| 109/109 [00:01<00:00, 79.33batch/s, loss=3.28e-5] 
Epoch 6: 100%|██████████| 109/109 [00:01<00:00, 93.25batch/s, loss=2.34e-5] 
Epoch 7: 100%|██████████| 109/109 [00:01<00:00, 82.02batch/s, loss=1.8e-5] 
Epoch 8: 100%|██████████| 109/109 [00:01<00:00, 90.10batch/s, loss=1.46e-5]
Epoch 9: 100%|██████████| 109/109 [00:01<00:00, 91.58batch/s, loss=1.22e-5]
Epoch 10: 100%|██████████| 109/109 [00:01<00:00, 94.86batch/s, loss=1.04e-5]
Epoch 11: 100%|██████████| 109/109 [00:01<00:00, 88.73batch/s, loss=9.38e-6]
Epoch 12: 100%|██████████| 109/109 [00:01<00:00, 92.01batch/s, loss=8.53e-6]
E

In [21]:
# Show the loss matrix rounded to 6 decimal places for easier reading.
np.round(lossMat, decimals=6)

array([[1.280e-04, 2.512e-03, 3.964e-03, 5.087e-03, 5.620e-03, 5.690e-03,
        5.566e-03, 5.331e-03, 5.004e-03, 4.747e-03, 4.501e-03, 4.242e-03],
       [2.200e-05, 5.500e-05, 1.194e-03, 2.874e-03, 3.656e-03, 4.188e-03,
        4.440e-03, 4.374e-03, 4.173e-03, 3.925e-03, 3.659e-03, 3.390e-03],
       [1.500e-05, 1.600e-05, 2.400e-05, 1.612e-03, 2.531e-03, 3.273e-03,
        3.715e-03, 3.799e-03, 3.676e-03, 3.468e-03, 3.248e-03, 3.033e-03],
       [4.000e-06, 7.000e-06, 1.000e-05, 1.900e-05, 9.520e-04, 1.884e-03,
        2.630e-03, 2.903e-03, 2.910e-03, 2.778e-03, 2.610e-03, 2.427e-03],
       [3.000e-06, 5.000e-06, 5.000e-06, 7.000e-06, 2.000e-05, 9.310e-04,
        1.836e-03, 2.253e-03, 2.352e-03, 2.297e-03, 2.162e-03, 2.022e-03],
       [3.000e-06, 3.000e-06, 4.000e-06, 5.000e-06, 6.000e-06, 8.000e-06,
        9.770e-04, 1.498e-03, 1.707e-03, 1.721e-03, 1.652e-03, 1.544e-03],
       [2.000e-06, 2.000e-06, 2.000e-06, 3.000e-06, 3.000e-06, 4.000e-06,
        6.000e-06, 5.940e-04, 9.

array(['10', '20', '30', '50', '70', '100', '150', '200', '250', '300',
       '350', '400'], dtype='<U11')

In [34]:
# Heatmap of the MSE matrix; both axes are labelled with the entries of
# `lat_dim` converted to strings so they render as categorical ticks.
latent_labels = np.array(lat_dim).astype(str)
px.imshow(
    lossMat,
    x=latent_labels,
    y=latent_labels,
    zmin=0,
    width=800,
    height=600,
    title='MSEs',
    labels={"x": "Dimensão 1", "y": "Dimensão 2", "color": "MSE"},
)

In [171]:
# Training hyperparameters.
n_epochs = 20     # number of epochs to run
batch_size = 150  # size of each batch

# Model, reconstruction loss and optimizer.
deeper = automlp600().to(device)
loss_fn = nn.MSELoss()
optimizer = optim.Adam(params=deeper.parameters(), lr=1e-3)

# Start offset of every mini-batch.
# NOTE(review): offsets are derived from len(X_train), while the training
# cells slice `emb_train` with them; confirm both have the same row count.
batch_start = torch.arange(0, len(X_train), step=batch_size)

# Per-epoch loss histories, reset every time this cell is run.
trainLoss, valLoss = [], []

In [169]:
# TODO: tune this training!
# Train `deeper` to reconstruct its own input (`emb_train`) with mini-batches,
# record the full-set train/validation loss after every epoch, and plot both
# curves at the end.
for epoch in range(n_epochs):
    deeper.train()
    with tqdm(batch_start, unit="batch", mininterval=0, disable=False) as bar:
        bar.set_description(f"Epoch {epoch}")
        for start in bar:
            # take a batch
            X_batch = emb_train[start:start+batch_size,:]
            # forward pass: the target is the input itself
            Xh = deeper(X_batch)
            loss = loss_fn(Xh, X_batch)
            # backward pass
            optimizer.zero_grad()
            loss.backward()
            # update weights
            optimizer.step()
            # print progress
            bar.set_postfix(loss=loss.item())
    # evaluate the reconstruction loss at the end of each epoch; no_grad avoids
    # building autograd graphs for these full-dataset forward passes
    deeper.eval()
    with torch.no_grad():
        Xh = deeper(emb_val)
        valLoss.append(loss_fn(Xh, emb_val).item())
        Xh = deeper(emb_train)
        trainLoss.append(loss_fn(Xh, emb_train).item())

# Loss curves: one point per epoch appended to valLoss / trainLoss.
fig = go.Figure()
fig.add_trace(go.Scatter(y=valLoss, mode="lines", showlegend=True, name='validação'))
fig.add_trace(go.Scatter(y=trainLoss, mode="lines", showlegend=True, name='treino'))
fig.show()

Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 142.98batch/s, loss=0.000631]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 221.01batch/s, loss=0.000284]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 232.02batch/s, loss=0.000169]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 245.62batch/s, loss=0.000114]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 212.11batch/s, loss=8.17e-5] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 237.10batch/s, loss=6.18e-5] 
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 198.73batch/s, loss=4.89e-5]
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 239.89batch/s, loss=4.15e-5]
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 241.53batch/s, loss=3.73e-5]
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 221.77batch/s, loss=3.15e-5]
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 227.41batch/s, loss=2.86e-5]
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 226.02batch/s, loss=2.37e-5]
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 210.33batch/s, loss

In [172]:
# TODO: tune this training!
# Train `deeper` to reconstruct its own input (`emb_train`) with mini-batches,
# record the full-set train/validation loss after every epoch, and plot both
# curves at the end.
for epoch in range(n_epochs):
    deeper.train()
    with tqdm(batch_start, unit="batch", mininterval=0, disable=False) as bar:
        bar.set_description(f"Epoch {epoch}")
        for start in bar:
            # take a batch
            X_batch = emb_train[start:start+batch_size,:]
            # forward pass: the target is the input itself
            Xh = deeper(X_batch)
            loss = loss_fn(Xh, X_batch)
            # backward pass
            optimizer.zero_grad()
            loss.backward()
            # update weights
            optimizer.step()
            # print progress
            bar.set_postfix(loss=loss.item())
    # evaluate the reconstruction loss at the end of each epoch; no_grad avoids
    # building autograd graphs for these full-dataset forward passes
    deeper.eval()
    with torch.no_grad():
        Xh = deeper(emb_val)
        valLoss.append(loss_fn(Xh, emb_val).item())
        Xh = deeper(emb_train)
        trainLoss.append(loss_fn(Xh, emb_train).item())

# Loss curves: one point per epoch appended to valLoss / trainLoss.
fig = go.Figure()
fig.add_trace(go.Scatter(y=valLoss, mode="lines", showlegend=True, name='validação'))
fig.add_trace(go.Scatter(y=trainLoss, mode="lines", showlegend=True, name='treino'))
fig.show()

Epoch 0: 100%|██████████| 109/109 [00:00<00:00, 162.29batch/s, loss=0.000737]
Epoch 1: 100%|██████████| 109/109 [00:00<00:00, 207.54batch/s, loss=0.000355]
Epoch 2: 100%|██████████| 109/109 [00:00<00:00, 232.22batch/s, loss=0.000222]
Epoch 3: 100%|██████████| 109/109 [00:00<00:00, 252.72batch/s, loss=0.000156]
Epoch 4: 100%|██████████| 109/109 [00:00<00:00, 227.05batch/s, loss=0.00012] 
Epoch 5: 100%|██████████| 109/109 [00:00<00:00, 224.70batch/s, loss=9.8e-5]  
Epoch 6: 100%|██████████| 109/109 [00:00<00:00, 222.96batch/s, loss=8.42e-5] 
Epoch 7: 100%|██████████| 109/109 [00:00<00:00, 241.34batch/s, loss=7.54e-5] 
Epoch 8: 100%|██████████| 109/109 [00:00<00:00, 245.86batch/s, loss=7.02e-5] 
Epoch 9: 100%|██████████| 109/109 [00:00<00:00, 220.87batch/s, loss=6.8e-5]  
Epoch 10: 100%|██████████| 109/109 [00:00<00:00, 241.76batch/s, loss=6.58e-5] 
Epoch 11: 100%|██████████| 109/109 [00:00<00:00, 240.30batch/s, loss=6.46e-5] 
Epoch 12: 100%|██████████| 109/109 [00:00<00:00, 242.08batch/s

# Que mais?