In [1]:
import os, sys
import random
from glob import glob
import numpy as np
from matplotlib import pyplot as plt
from torchvision.utils import save_image

import torch
import torch.nn as nn
import torch.nn.functional as F
from torch.utils.data import Dataset
from torch.utils.tensorboard import SummaryWriter
import torchvision
from torchvision import transforms
from PIL import Image

from tqdm import tqdm

In [2]:
class RWTHAllImg(Dataset):
    """Class to load all images from RWTH dataset"""
    def __init__(self, globpattern, transform=None):
        self.imglobs = globpattern
        self.transform = transform
    
    def __getitem__(self, idx):
        if torch.is_tensor(idx):
            idx = idx.tolist()
        img = Image.open(self.imglobs[idx])
        if self.transform:
            img = self.transform(img)
        sample = {'image': img}
        return sample
    
    def __len__(self):
        return len(self.imglobs)

In [3]:
class Autoencoder(nn.Module):
    def __init__(self):
        super(Autoencoder, self).__init__()
        

        self.conv1 = nn.Conv2d(3, 6, padding=2, kernel_size=5) # out = b, 6, 
        
        self.maxpool1 = nn.MaxPool2d(4, stride=1, return_indices=True)
        self.conv2 = nn.Conv2d(6, 16, padding=2, kernel_size=5)
        self.maxpool2 = nn.MaxPool2d(2, stride=1, return_indices=True)
        
        self.unpool2 = nn.MaxUnpool2d(2, stride=1)
        self.unconv2 = nn.ConvTranspose2d(16, 6, padding=2, kernel_size=5)
        self.unpool1 = nn.MaxUnpool2d(4, stride=1)
        self.unconv1 = nn.ConvTranspose2d(6, 3, padding=2, kernel_size=5)
        
    def forward(self,x):
        # Encoder
        x = self.conv1(x)
        x = F.relu(x)
        x, indices1 = self.maxpool1(x)
        x = self.conv2(x)
        x = F.relu(x)
        x, indices2 = self.maxpool2(x)
        
        # Decoder
        x = self.unpool2(x, indices2)
        x = F.relu(x)
        x = self.unconv2(x)
        x = self.unpool1(x, indices1)
        x = F.relu(x)
        x = self.unconv1(x)
        #x = F.tanh(x)
        
        return x
    
    def encoder(self, x):
        x = self.conv1(x)
        x = F.relu(x)
        x, indices1 = self.maxpool1(x)
        x = self.conv2(x)
        x = F.relu(x)
        x, indices2 = self.maxpool2(x)
        return x, indices1, indices2

In [4]:
preprocess = transforms.Compose([
    transforms.Resize((256, 256)),
    transforms.CenterCrop(256),
    transforms.ToTensor(),
    transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]),
])

In [5]:
traindir = "/home/reverie/datasets/phoenix2014-release/phoenix-2014-multisigner/features/fullFrame-210x260px/train"
train_glob = glob(os.path.join(traindir, "*/*/*.png"))
print(len(train_glob))
np.random.seed(3)
num_samples = 256 * 256
batch_size = 64
train_glob = np.random.choice(train_glob, num_samples, replace=False)
trainloader = torch.utils.data.DataLoader(RWTHAllImg(train_glob, transform=preprocess), batch_size=batch_size)

testdir = "/home/reverie/datasets/phoenix2014-release/phoenix-2014-multisigner/features/fullFrame-210x260px/test"
test_glob = glob(os.path.join(testdir, "*/*/*.png"))
print(len(test_glob))
test_glob  = np.random.choice(test_glob, 1000, replace=False)
testloader = torch.utils.data.DataLoader(RWTHAllImg(test_glob, transform=preprocess), batch_size=batch_size)

633621
89472


In [6]:
total_itr = num_samples // batch_size
total_itr

1024

In [7]:
model = Autoencoder().cuda()
criterion = nn.MSELoss()
optimizer = torch.optim.Adam(model.parameters(), lr=1e-3,
                             weight_decay=1e-5)
scheduler = torch.optim.lr_scheduler.ReduceLROnPlateau(optimizer, 'min', patience=1, verbose = True, factor = 0.1, min_lr=1e-5, threshold=1e-3)
num_epochs = 5

In [8]:
print(model)

Autoencoder(
  (conv1): Conv2d(3, 6, kernel_size=(5, 5), stride=(1, 1), padding=(2, 2))
  (maxpool1): MaxPool2d(kernel_size=4, stride=1, padding=0, dilation=1, ceil_mode=False)
  (conv2): Conv2d(6, 16, kernel_size=(5, 5), stride=(1, 1), padding=(2, 2))
  (maxpool2): MaxPool2d(kernel_size=2, stride=1, padding=0, dilation=1, ceil_mode=False)
  (unpool2): MaxUnpool2d(kernel_size=(2, 2), stride=(1, 1), padding=(0, 0))
  (unconv2): ConvTranspose2d(16, 6, kernel_size=(5, 5), stride=(1, 1), padding=(2, 2))
  (unpool1): MaxUnpool2d(kernel_size=(4, 4), stride=(1, 1), padding=(0, 0))
  (unconv1): ConvTranspose2d(6, 3, kernel_size=(5, 5), stride=(1, 1), padding=(2, 2))
)


In [9]:
def to_img(x):
    x = 0.5 * (x + 1)
    x = x.clamp(0, 1)
    x = x.view(x.size(0), 3, 256, 256)
    return x

In [10]:
def save_checkpoint(model, optimizer, scheduler, epoch, loss, itr):
    chkpt = {
        'model': model.state_dict(),
        'optimizer': optimizer.state_dict(),
        'scheduler': scheduler.state_dict(),
        'epoch': epoch,
        'loss': loss
    }
    torch.save(chkpt, f'chkpt_{epoch}_{itr}.pth')

def load_checkpoint(path, model, optimizer, scheduler):
    if os.path.isfile(path):
        chpkt = torch.load(path)
        print(f"Loading checkpoint epoch:{chpkt['epoch']} and loss:{chpkt['loss']}")
        model.load_state_dict(chpkt['model'])
        optimizer.load_state_dict(chpkt['optimizer'])
        scheduler.load_state_dict(chpkt['scheduler'])
        return model, optimizer, scheduler
    else:
        print(f"{path} is not a valid file")

In [11]:
writer = SummaryWriter()

In [12]:
#model, optimizer, scheduler = load_checkpoint('./chkpt_4_1000.pth', model, optimizer, scheduler)
scheduler.threshold = 1e-5
for epoch in tqdm(range(num_epochs)):
    itr = 0
    for data in tqdm(trainloader):
        img = data['image']
        img = img.cuda()
        # ===================forward=====================
        output = model(img)
        loss = criterion(output, img)
        # ===================backward====================
        optimizer.zero_grad()
        loss.backward()
        optimizer.step()
        
        writer.add_scalar(f'Loss/{epoch}', loss, itr)
        itr += 1
        if itr % 100 == 0:
            print(f"{itr}/{total_itr} iterations, loss:{loss}")
        if itr % 500 == 0:
            save_checkpoint(model, optimizer, scheduler, epoch, loss, itr)
    # ===================log========================
    print('epoch [{}/{}], loss:{:.4f}'
          .format(epoch + 1, num_epochs, loss))
    scheduler.step(loss)
    pic = to_img(output.cpu().data)
    #grid = torchvision.utils.make_grid(pic)
    #writer.add_image('images', grid)
    #writer.add_graph(model, pic.cuda())
    save_image(pic, './dc_img/image_{}.png'.format(epoch))

  0%|          | 0/5 [00:00<?, ?it/s]
  0%|          | 0/1024 [00:00<?, ?it/s][A
  0%|          | 1/1024 [00:00<09:45,  1.75it/s][A
  0%|          | 2/1024 [00:01<09:03,  1.88it/s][A
  0%|          | 3/1024 [00:01<08:36,  1.98it/s][A
  0%|          | 4/1024 [00:01<08:12,  2.07it/s][A
  0%|          | 5/1024 [00:02<07:59,  2.12it/s][A
  1%|          | 6/1024 [00:02<07:47,  2.18it/s][A
  1%|          | 7/1024 [00:03<07:45,  2.19it/s][A
  1%|          | 8/1024 [00:03<07:36,  2.22it/s][A
  1%|          | 9/1024 [00:04<07:31,  2.25it/s][A
  1%|          | 10/1024 [00:04<07:30,  2.25it/s][A
  1%|          | 11/1024 [00:04<07:31,  2.25it/s][A
  1%|          | 12/1024 [00:05<07:37,  2.21it/s][A
  1%|▏         | 13/1024 [00:08<23:09,  1.37s/it][A
  1%|▏         | 14/1024 [00:11<29:28,  1.75s/it][A
  1%|▏         | 15/1024 [00:14<33:52,  2.01s/it][A
  2%|▏         | 16/1024 [00:16<36:27,  2.17s/it][A
  2%|▏         | 17/1024 [00:19<39:42,  2.37s/it][A
  2%|▏         | 18/1024 [

100/1024 iterations, loss:0.169610857963562



 10%|▉         | 101/1024 [04:19<46:26,  3.02s/it][A
 10%|▉         | 102/1024 [04:20<40:50,  2.66s/it][A
 10%|█         | 103/1024 [04:22<36:32,  2.38s/it][A
 10%|█         | 104/1024 [04:24<33:29,  2.18s/it][A
 10%|█         | 105/1024 [04:26<32:05,  2.10s/it][A
 10%|█         | 106/1024 [04:27<29:59,  1.96s/it][A
 10%|█         | 107/1024 [04:29<29:31,  1.93s/it][A
 11%|█         | 108/1024 [04:31<28:04,  1.84s/it][A
 11%|█         | 109/1024 [04:32<26:55,  1.77s/it][A
 11%|█         | 110/1024 [04:34<28:05,  1.84s/it][A
 11%|█         | 111/1024 [04:36<26:54,  1.77s/it][A
 11%|█         | 112/1024 [04:47<1:07:12,  4.42s/it][A
 11%|█         | 113/1024 [04:51<1:08:41,  4.52s/it][A
 11%|█         | 114/1024 [04:54<59:05,  3.90s/it]  [A
 11%|█         | 115/1024 [04:56<49:40,  3.28s/it][A
 11%|█▏        | 116/1024 [04:58<46:23,  3.07s/it][A
 11%|█▏        | 117/1024 [05:01<45:17,  3.00s/it][A
 12%|█▏        | 118/1024 [05:04<44:53,  2.97s/it][A
 12%|█▏        | 119/

200/1024 iterations, loss:0.11516422033309937



 20%|█▉        | 201/1024 [09:00<1:00:46,  4.43s/it][A
 20%|█▉        | 202/1024 [09:03<54:51,  4.00s/it]  [A
 20%|█▉        | 203/1024 [09:06<49:09,  3.59s/it][A
 20%|█▉        | 204/1024 [09:08<42:47,  3.13s/it][A
 20%|██        | 205/1024 [09:09<37:02,  2.71s/it][A
 20%|██        | 206/1024 [09:12<36:49,  2.70s/it][A
 20%|██        | 207/1024 [09:14<35:09,  2.58s/it][A
 20%|██        | 208/1024 [09:17<33:14,  2.44s/it][A
 20%|██        | 209/1024 [09:21<40:10,  2.96s/it][A
 21%|██        | 210/1024 [09:24<39:32,  2.91s/it][A
 21%|██        | 211/1024 [09:33<1:06:16,  4.89s/it][A
 21%|██        | 212/1024 [09:37<1:00:44,  4.49s/it][A
 21%|██        | 213/1024 [09:39<51:09,  3.78s/it]  [A
 21%|██        | 214/1024 [09:41<43:55,  3.25s/it][A
 21%|██        | 215/1024 [09:43<39:21,  2.92s/it][A
 21%|██        | 216/1024 [09:45<35:36,  2.64s/it][A
 21%|██        | 217/1024 [09:48<36:54,  2.74s/it][A
 21%|██▏       | 218/1024 [09:50<34:14,  2.55s/it][A
 21%|██▏       | 

300/1024 iterations, loss:0.197213813662529



 29%|██▉       | 301/1024 [14:14<40:52,  3.39s/it][A
 29%|██▉       | 302/1024 [14:17<39:50,  3.31s/it][A
 30%|██▉       | 303/1024 [14:20<38:11,  3.18s/it][A
 30%|██▉       | 304/1024 [14:22<33:15,  2.77s/it][A
 30%|██▉       | 305/1024 [14:25<34:27,  2.87s/it][A
 30%|██▉       | 306/1024 [14:28<34:32,  2.89s/it][A
 30%|██▉       | 307/1024 [14:30<33:09,  2.78s/it][A
 30%|███       | 308/1024 [14:33<32:35,  2.73s/it][A
 30%|███       | 309/1024 [14:35<30:28,  2.56s/it][A
 30%|███       | 310/1024 [14:45<58:53,  4.95s/it][A
 30%|███       | 311/1024 [14:48<49:36,  4.17s/it][A
 30%|███       | 312/1024 [14:50<42:54,  3.62s/it][A
 31%|███       | 313/1024 [14:52<38:10,  3.22s/it][A
 31%|███       | 314/1024 [14:56<37:52,  3.20s/it][A
 31%|███       | 315/1024 [14:58<36:07,  3.06s/it][A
 31%|███       | 316/1024 [15:02<37:17,  3.16s/it][A
 31%|███       | 317/1024 [15:03<31:52,  2.71s/it][A
 31%|███       | 318/1024 [15:06<32:07,  2.73s/it][A
 31%|███       | 319/1024 [

400/1024 iterations, loss:0.08202064782381058



 39%|███▉      | 401/1024 [18:59<27:51,  2.68s/it][A
 39%|███▉      | 402/1024 [19:01<24:14,  2.34s/it][A
 39%|███▉      | 403/1024 [19:02<22:12,  2.14s/it][A
 39%|███▉      | 404/1024 [19:04<20:46,  2.01s/it][A
 40%|███▉      | 405/1024 [19:06<20:00,  1.94s/it][A
 40%|███▉      | 406/1024 [19:07<19:07,  1.86s/it][A
 40%|███▉      | 407/1024 [19:09<18:27,  1.79s/it][A
 40%|███▉      | 408/1024 [19:11<18:37,  1.81s/it][A
 40%|███▉      | 409/1024 [19:13<18:04,  1.76s/it][A
 40%|████      | 410/1024 [19:14<17:42,  1.73s/it][A
 40%|████      | 411/1024 [19:16<17:58,  1.76s/it][A
 40%|████      | 412/1024 [19:23<35:19,  3.46s/it][A
 40%|████      | 413/1024 [19:33<52:35,  5.16s/it][A
 40%|████      | 414/1024 [19:35<42:46,  4.21s/it][A
 41%|████      | 415/1024 [19:36<34:59,  3.45s/it][A
 41%|████      | 416/1024 [19:38<29:10,  2.88s/it][A
 41%|████      | 417/1024 [19:40<25:52,  2.56s/it][A
 41%|████      | 418/1024 [19:41<23:01,  2.28s/it][A
 41%|████      | 419/1024 [

500/1024 iterations, loss:0.07074828445911407



 49%|████▉     | 501/1024 [23:15<20:25,  2.34s/it][A
 49%|████▉     | 502/1024 [23:17<20:13,  2.32s/it][A
 49%|████▉     | 503/1024 [23:20<21:17,  2.45s/it][A
 49%|████▉     | 504/1024 [23:23<22:11,  2.56s/it][A
 49%|████▉     | 505/1024 [23:35<47:18,  5.47s/it][A
 49%|████▉     | 506/1024 [23:38<40:11,  4.65s/it][A
 50%|████▉     | 507/1024 [23:40<32:21,  3.76s/it][A
 50%|████▉     | 508/1024 [23:42<27:55,  3.25s/it][A
 50%|████▉     | 509/1024 [23:44<25:05,  2.92s/it][A
 50%|████▉     | 510/1024 [23:46<23:36,  2.75s/it][A
 50%|████▉     | 511/1024 [23:49<22:08,  2.59s/it][A
 50%|█████     | 512/1024 [23:51<21:03,  2.47s/it][A
 50%|█████     | 513/1024 [23:53<21:05,  2.48s/it][A
 50%|█████     | 514/1024 [23:56<22:43,  2.67s/it][A
 50%|█████     | 515/1024 [23:59<23:20,  2.75s/it][A
 50%|█████     | 516/1024 [24:01<21:49,  2.58s/it][A
 50%|█████     | 517/1024 [24:13<43:23,  5.14s/it][A
 51%|█████     | 518/1024 [24:15<35:46,  4.24s/it][A
 51%|█████     | 519/1024 [

600/1024 iterations, loss:0.06723137944936752



 59%|█████▊    | 601/1024 [28:21<20:00,  2.84s/it][A
 59%|█████▉    | 602/1024 [28:24<20:22,  2.90s/it][A
 59%|█████▉    | 603/1024 [28:28<22:07,  3.15s/it][A
 59%|█████▉    | 604/1024 [28:29<19:03,  2.72s/it][A
 59%|█████▉    | 605/1024 [28:32<19:25,  2.78s/it][A
 59%|█████▉    | 606/1024 [28:34<17:10,  2.46s/it][A
 59%|█████▉    | 607/1024 [28:37<17:59,  2.59s/it][A
 59%|█████▉    | 608/1024 [28:39<16:02,  2.31s/it][A
 59%|█████▉    | 609/1024 [28:41<16:39,  2.41s/it][A
 60%|█████▉    | 610/1024 [28:48<24:52,  3.61s/it][A
 60%|█████▉    | 611/1024 [28:50<21:38,  3.14s/it][A
 60%|█████▉    | 612/1024 [28:52<19:36,  2.86s/it][A
 60%|█████▉    | 613/1024 [28:54<18:13,  2.66s/it][A
 60%|█████▉    | 614/1024 [28:56<15:57,  2.34s/it][A
 60%|██████    | 615/1024 [28:59<16:57,  2.49s/it][A
 60%|██████    | 616/1024 [29:00<15:34,  2.29s/it][A
 60%|██████    | 617/1024 [29:02<13:53,  2.05s/it][A
 60%|██████    | 618/1024 [29:05<16:25,  2.43s/it][A
 60%|██████    | 619/1024 [

700/1024 iterations, loss:0.058942344039678574



 68%|██████▊   | 701/1024 [33:00<11:56,  2.22s/it][A
 69%|██████▊   | 702/1024 [33:02<11:00,  2.05s/it][A
 69%|██████▊   | 703/1024 [33:04<10:20,  1.93s/it][A
 69%|██████▉   | 704/1024 [33:05<10:00,  1.88s/it][A
 69%|██████▉   | 705/1024 [33:07<09:32,  1.79s/it][A
 69%|██████▉   | 706/1024 [33:09<09:10,  1.73s/it][A
 69%|██████▉   | 707/1024 [33:10<09:17,  1.76s/it][A
 69%|██████▉   | 708/1024 [33:12<08:58,  1.70s/it][A
 69%|██████▉   | 709/1024 [33:14<08:41,  1.66s/it][A
 69%|██████▉   | 710/1024 [33:16<10:37,  2.03s/it][A
 69%|██████▉   | 711/1024 [33:18<10:15,  1.97s/it][A
 70%|██████▉   | 712/1024 [33:34<31:05,  5.98s/it][A
 70%|██████▉   | 713/1024 [33:36<25:50,  4.98s/it][A
 70%|██████▉   | 714/1024 [33:38<20:18,  3.93s/it][A
 70%|██████▉   | 715/1024 [33:40<18:08,  3.52s/it][A
 70%|██████▉   | 716/1024 [33:42<15:00,  2.93s/it][A
 70%|███████   | 717/1024 [33:44<13:03,  2.55s/it][A
 70%|███████   | 718/1024 [33:45<11:52,  2.33s/it][A
 70%|███████   | 719/1024 [

800/1024 iterations, loss:0.05059121176600456



 78%|███████▊  | 801/1024 [37:14<06:25,  1.73s/it][A
 78%|███████▊  | 802/1024 [37:16<06:29,  1.75s/it][A
 78%|███████▊  | 803/1024 [37:18<06:35,  1.79s/it][A
 79%|███████▊  | 804/1024 [37:20<07:10,  1.96s/it][A
 79%|███████▊  | 805/1024 [37:22<06:45,  1.85s/it][A
 79%|███████▊  | 806/1024 [37:24<06:29,  1.79s/it][A
 79%|███████▉  | 807/1024 [37:43<25:08,  6.95s/it][A
 79%|███████▉  | 808/1024 [37:46<21:11,  5.89s/it][A
 79%|███████▉  | 809/1024 [37:49<17:27,  4.87s/it][A
 79%|███████▉  | 810/1024 [37:51<14:40,  4.11s/it][A
 79%|███████▉  | 811/1024 [37:54<13:16,  3.74s/it][A
 79%|███████▉  | 812/1024 [37:57<13:04,  3.70s/it][A
 79%|███████▉  | 813/1024 [37:59<10:50,  3.08s/it][A
 79%|███████▉  | 814/1024 [38:01<09:15,  2.64s/it][A
 80%|███████▉  | 815/1024 [38:03<09:19,  2.68s/it][A
 80%|███████▉  | 816/1024 [38:06<09:25,  2.72s/it][A
 80%|███████▉  | 817/1024 [38:08<08:19,  2.41s/it][A
 80%|███████▉  | 818/1024 [38:10<07:27,  2.17s/it][A
 80%|███████▉  | 819/1024 [

900/1024 iterations, loss:0.05004924535751343



 88%|████████▊ | 901/1024 [41:37<04:26,  2.17s/it][A
 88%|████████▊ | 902/1024 [41:38<04:06,  2.02s/it][A
 88%|████████▊ | 903/1024 [41:40<03:44,  1.85s/it][A
 88%|████████▊ | 904/1024 [41:41<03:39,  1.83s/it][A
 88%|████████▊ | 905/1024 [41:43<03:27,  1.74s/it][A
 88%|████████▊ | 906/1024 [41:45<03:17,  1.68s/it][A
 89%|████████▊ | 907/1024 [41:46<03:16,  1.68s/it][A
 89%|████████▊ | 908/1024 [41:48<03:15,  1.68s/it][A
 89%|████████▉ | 909/1024 [42:06<12:45,  6.66s/it][A
 89%|████████▉ | 910/1024 [42:08<09:53,  5.21s/it][A
 89%|████████▉ | 911/1024 [42:10<07:48,  4.15s/it][A
 89%|████████▉ | 912/1024 [42:11<06:18,  3.38s/it][A
 89%|████████▉ | 913/1024 [42:13<05:22,  2.91s/it][A
 89%|████████▉ | 914/1024 [42:15<04:36,  2.51s/it][A
 89%|████████▉ | 915/1024 [42:16<04:06,  2.26s/it][A
 89%|████████▉ | 916/1024 [42:18<03:42,  2.06s/it][A
 90%|████████▉ | 917/1024 [42:20<03:36,  2.02s/it][A
 90%|████████▉ | 918/1024 [42:21<03:21,  1.90s/it][A
 90%|████████▉ | 919/1024 [

1000/1024 iterations, loss:0.04699109494686127



 98%|█████████▊| 1001/1024 [46:03<00:56,  2.47s/it][A
 98%|█████████▊| 1002/1024 [46:05<00:50,  2.30s/it][A
 98%|█████████▊| 1003/1024 [46:06<00:45,  2.16s/it][A
 98%|█████████▊| 1004/1024 [46:08<00:40,  2.04s/it][A
 98%|█████████▊| 1005/1024 [46:10<00:37,  1.95s/it][A
 98%|█████████▊| 1006/1024 [46:12<00:33,  1.86s/it][A
 98%|█████████▊| 1007/1024 [46:13<00:30,  1.79s/it][A
 98%|█████████▊| 1008/1024 [46:15<00:29,  1.85s/it][A
 99%|█████████▊| 1009/1024 [46:17<00:27,  1.81s/it][A
 99%|█████████▊| 1010/1024 [46:18<00:24,  1.72s/it][A
 99%|█████████▊| 1011/1024 [46:20<00:22,  1.77s/it][A
 99%|█████████▉| 1012/1024 [46:30<00:50,  4.23s/it][A
 99%|█████████▉| 1013/1024 [46:37<00:55,  5.05s/it][A
 99%|█████████▉| 1014/1024 [46:39<00:42,  4.20s/it][A
 99%|█████████▉| 1015/1024 [46:41<00:31,  3.45s/it][A
 99%|█████████▉| 1016/1024 [46:43<00:23,  2.94s/it][A
 99%|█████████▉| 1017/1024 [46:45<00:18,  2.58s/it][A
 99%|█████████▉| 1018/1024 [46:46<00:14,  2.34s/it][A
100%|████

epoch [1/5], loss:0.0445


 20%|██        | 1/5 [46:58<3:07:53, 2818.36s/it]
  0%|          | 0/1024 [00:00<?, ?it/s][A
  0%|          | 1/1024 [00:00<07:26,  2.29it/s][A
  0%|          | 2/1024 [00:00<07:28,  2.28it/s][A
  0%|          | 3/1024 [00:01<07:29,  2.27it/s][A
  0%|          | 4/1024 [00:01<07:27,  2.28it/s][A
  0%|          | 5/1024 [00:02<07:27,  2.28it/s][A
  1%|          | 6/1024 [00:02<07:28,  2.27it/s][A
  1%|          | 7/1024 [00:03<07:27,  2.27it/s][A
  1%|          | 8/1024 [00:03<07:25,  2.28it/s][A
  1%|          | 9/1024 [00:03<07:28,  2.26it/s][A
  1%|          | 10/1024 [00:04<07:26,  2.27it/s][A
  1%|          | 11/1024 [00:04<07:27,  2.26it/s][A
  1%|          | 12/1024 [00:05<07:27,  2.26it/s][A
  1%|▏         | 13/1024 [00:05<07:27,  2.26it/s][A
  1%|▏         | 14/1024 [00:06<07:27,  2.26it/s][A
  1%|▏         | 15/1024 [00:06<07:27,  2.25it/s][A
  2%|▏         | 16/1024 [00:07<07:25,  2.26it/s][A
  2%|▏         | 17/1024 [00:07<07:24,  2.27it/s][A
  2%|▏        

100/1024 iterations, loss:0.043123167008161545



 10%|▉         | 101/1024 [00:45<07:01,  2.19it/s][A
 10%|▉         | 102/1024 [00:45<06:59,  2.20it/s][A
 10%|█         | 103/1024 [00:45<07:01,  2.18it/s][A
 10%|█         | 104/1024 [00:46<06:57,  2.20it/s][A
 10%|█         | 105/1024 [00:46<06:53,  2.22it/s][A
 10%|█         | 106/1024 [00:47<06:49,  2.24it/s][A
 10%|█         | 107/1024 [00:47<06:47,  2.25it/s][A
 11%|█         | 108/1024 [00:48<06:49,  2.24it/s][A
 11%|█         | 109/1024 [00:48<06:42,  2.27it/s][A
 11%|█         | 110/1024 [00:49<06:41,  2.28it/s][A
 11%|█         | 111/1024 [00:49<06:40,  2.28it/s][A
 11%|█         | 112/1024 [00:49<06:41,  2.27it/s][A
 11%|█         | 113/1024 [00:50<06:41,  2.27it/s][A
 11%|█         | 114/1024 [00:50<06:41,  2.27it/s][A
 11%|█         | 115/1024 [00:51<06:39,  2.27it/s][A
 11%|█▏        | 116/1024 [00:51<06:38,  2.28it/s][A
 11%|█▏        | 117/1024 [00:52<06:38,  2.27it/s][A
 12%|█▏        | 118/1024 [00:52<06:42,  2.25it/s][A
 12%|█▏        | 119/1024 [

200/1024 iterations, loss:0.044824838638305664



 20%|█▉        | 201/1024 [01:38<08:00,  1.71it/s][A
 20%|█▉        | 202/1024 [01:38<08:01,  1.71it/s][A
 20%|█▉        | 203/1024 [01:39<07:59,  1.71it/s][A
 20%|█▉        | 204/1024 [01:39<07:57,  1.72it/s][A
 20%|██        | 205/1024 [01:40<07:55,  1.72it/s][A
 20%|██        | 206/1024 [01:41<07:57,  1.71it/s][A
 20%|██        | 207/1024 [01:41<07:55,  1.72it/s][A
 20%|██        | 208/1024 [01:42<07:55,  1.72it/s][A
 20%|██        | 209/1024 [01:42<07:55,  1.71it/s][A
 21%|██        | 210/1024 [01:43<07:54,  1.72it/s][A
 21%|██        | 211/1024 [01:44<07:53,  1.72it/s][A
 21%|██        | 212/1024 [01:44<07:54,  1.71it/s][A
 21%|██        | 213/1024 [01:45<08:00,  1.69it/s][A
 21%|██        | 214/1024 [01:45<07:59,  1.69it/s][A
 21%|██        | 215/1024 [01:46<07:55,  1.70it/s][A
 21%|██        | 216/1024 [01:46<07:54,  1.70it/s][A
 21%|██        | 217/1024 [01:47<07:52,  1.71it/s][A
 21%|██▏       | 218/1024 [01:48<07:56,  1.69it/s][A
 21%|██▏       | 219/1024 [

300/1024 iterations, loss:0.04803142324090004



 29%|██▉       | 301/1024 [02:36<07:00,  1.72it/s][A
 29%|██▉       | 302/1024 [02:37<07:03,  1.70it/s][A
 30%|██▉       | 303/1024 [02:37<07:04,  1.70it/s][A
 30%|██▉       | 304/1024 [02:38<07:01,  1.71it/s][A
 30%|██▉       | 305/1024 [02:39<07:01,  1.70it/s][A
 30%|██▉       | 306/1024 [02:39<06:59,  1.71it/s][A
 30%|██▉       | 307/1024 [02:40<07:02,  1.70it/s][A
 30%|███       | 308/1024 [02:40<07:00,  1.70it/s][A
 30%|███       | 309/1024 [02:41<07:01,  1.69it/s][A
 30%|███       | 310/1024 [02:42<07:01,  1.69it/s][A
 30%|███       | 311/1024 [02:42<07:03,  1.68it/s][A
 30%|███       | 312/1024 [02:43<07:04,  1.68it/s][A
 31%|███       | 313/1024 [02:43<07:04,  1.68it/s][A
 31%|███       | 314/1024 [02:44<07:00,  1.69it/s][A
 31%|███       | 315/1024 [02:44<06:59,  1.69it/s][A
 31%|███       | 316/1024 [02:45<06:58,  1.69it/s][A
 31%|███       | 317/1024 [02:46<06:57,  1.69it/s][A
 31%|███       | 318/1024 [02:46<06:58,  1.69it/s][A
 31%|███       | 319/1024 [

400/1024 iterations, loss:0.0500030480325222



 39%|███▉      | 401/1024 [03:35<06:04,  1.71it/s][A
 39%|███▉      | 402/1024 [03:35<06:02,  1.72it/s][A
 39%|███▉      | 403/1024 [03:36<06:02,  1.71it/s][A
 39%|███▉      | 404/1024 [03:36<06:00,  1.72it/s][A
 40%|███▉      | 405/1024 [03:37<05:59,  1.72it/s][A
 40%|███▉      | 406/1024 [03:38<05:59,  1.72it/s][A
 40%|███▉      | 407/1024 [03:38<05:59,  1.72it/s][A
 40%|███▉      | 408/1024 [03:39<05:58,  1.72it/s][A
 40%|███▉      | 409/1024 [03:39<05:57,  1.72it/s][A
 40%|████      | 410/1024 [03:40<05:56,  1.72it/s][A
 40%|████      | 411/1024 [03:41<05:55,  1.72it/s][A
 40%|████      | 412/1024 [03:41<05:54,  1.73it/s][A
 40%|████      | 413/1024 [03:42<05:53,  1.73it/s][A
 40%|████      | 414/1024 [03:42<05:53,  1.73it/s][A
 41%|████      | 415/1024 [03:43<05:54,  1.72it/s][A
 41%|████      | 416/1024 [03:43<05:53,  1.72it/s][A
 41%|████      | 417/1024 [03:44<05:53,  1.72it/s][A
 41%|████      | 418/1024 [03:45<05:53,  1.72it/s][A
 41%|████      | 419/1024 [

500/1024 iterations, loss:0.036287639290094376



 49%|████▉     | 501/1024 [04:33<05:06,  1.70it/s][A
 49%|████▉     | 502/1024 [04:34<05:04,  1.71it/s][A
 49%|████▉     | 503/1024 [04:34<05:02,  1.72it/s][A
 49%|████▉     | 504/1024 [04:35<05:01,  1.72it/s][A
 49%|████▉     | 505/1024 [04:35<05:00,  1.73it/s][A
 49%|████▉     | 506/1024 [04:36<05:00,  1.72it/s][A
 50%|████▉     | 507/1024 [04:37<05:02,  1.71it/s][A
 50%|████▉     | 508/1024 [04:37<05:01,  1.71it/s][A
 50%|████▉     | 509/1024 [04:38<05:00,  1.71it/s][A
 50%|████▉     | 510/1024 [04:38<04:59,  1.72it/s][A
 50%|████▉     | 511/1024 [04:39<04:57,  1.72it/s][A
 50%|█████     | 512/1024 [04:40<04:57,  1.72it/s][A
 50%|█████     | 513/1024 [04:40<04:56,  1.72it/s][A
 50%|█████     | 514/1024 [04:41<04:56,  1.72it/s][A
 50%|█████     | 515/1024 [04:41<04:55,  1.72it/s][A
 50%|█████     | 516/1024 [04:42<04:55,  1.72it/s][A
 50%|█████     | 517/1024 [04:42<04:54,  1.72it/s][A
 51%|█████     | 518/1024 [04:43<04:56,  1.71it/s][A
 51%|█████     | 519/1024 [

600/1024 iterations, loss:0.0403955839574337



 59%|█████▊    | 601/1024 [05:31<04:04,  1.73it/s][A
 59%|█████▉    | 602/1024 [05:32<04:04,  1.73it/s][A
 59%|█████▉    | 603/1024 [05:33<04:03,  1.73it/s][A
 59%|█████▉    | 604/1024 [05:33<04:03,  1.72it/s][A
 59%|█████▉    | 605/1024 [05:34<04:03,  1.72it/s][A
 59%|█████▉    | 606/1024 [05:34<04:02,  1.72it/s][A
 59%|█████▉    | 607/1024 [05:35<04:02,  1.72it/s][A
 59%|█████▉    | 608/1024 [05:35<04:02,  1.72it/s][A
 59%|█████▉    | 609/1024 [05:36<04:01,  1.72it/s][A
 60%|█████▉    | 610/1024 [05:37<04:01,  1.71it/s][A
 60%|█████▉    | 611/1024 [05:37<04:01,  1.71it/s][A
 60%|█████▉    | 612/1024 [05:38<04:00,  1.71it/s][A
 60%|█████▉    | 613/1024 [05:38<03:59,  1.71it/s][A
 60%|█████▉    | 614/1024 [05:39<04:00,  1.71it/s][A
 60%|██████    | 615/1024 [05:40<03:59,  1.71it/s][A
 60%|██████    | 616/1024 [05:40<03:57,  1.71it/s][A
 60%|██████    | 617/1024 [05:41<03:56,  1.72it/s][A
 60%|██████    | 618/1024 [05:41<03:55,  1.72it/s][A
 60%|██████    | 619/1024 [

700/1024 iterations, loss:0.03549725189805031



 68%|██████▊   | 701/1024 [06:30<03:09,  1.70it/s][A
 69%|██████▊   | 702/1024 [06:30<03:10,  1.69it/s][A
 69%|██████▊   | 703/1024 [06:31<03:08,  1.70it/s][A
 69%|██████▉   | 704/1024 [06:32<03:07,  1.71it/s][A
 69%|██████▉   | 705/1024 [06:32<03:07,  1.71it/s][A
 69%|██████▉   | 706/1024 [06:33<03:05,  1.71it/s][A
 69%|██████▉   | 707/1024 [06:33<03:04,  1.71it/s][A
 69%|██████▉   | 708/1024 [06:34<03:03,  1.72it/s][A
 69%|██████▉   | 709/1024 [06:34<03:03,  1.71it/s][A
 69%|██████▉   | 710/1024 [06:35<03:03,  1.71it/s][A
 69%|██████▉   | 711/1024 [06:36<03:02,  1.72it/s][A
 70%|██████▉   | 712/1024 [06:36<03:01,  1.72it/s][A
 70%|██████▉   | 713/1024 [06:37<03:00,  1.72it/s][A
 70%|██████▉   | 714/1024 [06:37<03:00,  1.72it/s][A
 70%|██████▉   | 715/1024 [06:38<02:59,  1.72it/s][A
 70%|██████▉   | 716/1024 [06:39<02:59,  1.72it/s][A
 70%|███████   | 717/1024 [06:39<02:58,  1.72it/s][A
 70%|███████   | 718/1024 [06:40<02:57,  1.72it/s][A
 70%|███████   | 719/1024 [

800/1024 iterations, loss:0.04218891263008118



 78%|███████▊  | 801/1024 [07:28<02:09,  1.72it/s][A
 78%|███████▊  | 802/1024 [07:29<02:09,  1.72it/s][A
 78%|███████▊  | 803/1024 [07:29<02:08,  1.71it/s][A
 79%|███████▊  | 804/1024 [07:30<02:08,  1.71it/s][A
 79%|███████▊  | 805/1024 [07:30<02:08,  1.71it/s][A
 79%|███████▊  | 806/1024 [07:31<02:07,  1.71it/s][A
 79%|███████▉  | 807/1024 [07:32<02:06,  1.71it/s][A
 79%|███████▉  | 808/1024 [07:32<02:05,  1.72it/s][A
 79%|███████▉  | 809/1024 [07:33<02:05,  1.71it/s][A
 79%|███████▉  | 810/1024 [07:33<02:04,  1.72it/s][A
 79%|███████▉  | 811/1024 [07:34<02:03,  1.72it/s][A
 79%|███████▉  | 812/1024 [07:35<02:03,  1.72it/s][A
 79%|███████▉  | 813/1024 [07:35<02:02,  1.72it/s][A
 79%|███████▉  | 814/1024 [07:36<02:01,  1.72it/s][A
 80%|███████▉  | 815/1024 [07:36<02:01,  1.72it/s][A
 80%|███████▉  | 816/1024 [07:37<02:00,  1.72it/s][A
 80%|███████▉  | 817/1024 [07:37<02:00,  1.72it/s][A
 80%|███████▉  | 818/1024 [07:38<01:59,  1.72it/s][A
 80%|███████▉  | 819/1024 [

900/1024 iterations, loss:0.03554781153798103



 88%|████████▊ | 901/1024 [08:26<01:11,  1.72it/s][A
 88%|████████▊ | 902/1024 [08:27<01:10,  1.72it/s][A
 88%|████████▊ | 903/1024 [08:28<01:10,  1.72it/s][A
 88%|████████▊ | 904/1024 [08:28<01:11,  1.69it/s][A
 88%|████████▊ | 905/1024 [08:29<01:10,  1.69it/s][A
 88%|████████▊ | 906/1024 [08:29<01:09,  1.70it/s][A
 89%|████████▊ | 907/1024 [08:30<01:08,  1.71it/s][A
 89%|████████▊ | 908/1024 [08:31<01:07,  1.72it/s][A
 89%|████████▉ | 909/1024 [08:31<01:07,  1.71it/s][A
 89%|████████▉ | 910/1024 [08:32<01:06,  1.72it/s][A
 89%|████████▉ | 911/1024 [08:32<01:05,  1.72it/s][A
 89%|████████▉ | 912/1024 [08:33<01:05,  1.72it/s][A
 89%|████████▉ | 913/1024 [08:33<01:04,  1.71it/s][A
 89%|████████▉ | 914/1024 [08:34<01:04,  1.72it/s][A
 89%|████████▉ | 915/1024 [08:35<01:03,  1.71it/s][A
 89%|████████▉ | 916/1024 [08:35<01:02,  1.72it/s][A
 90%|████████▉ | 917/1024 [08:36<01:02,  1.71it/s][A
 90%|████████▉ | 918/1024 [08:36<01:01,  1.71it/s][A
 90%|████████▉ | 919/1024 [

1000/1024 iterations, loss:0.05129751190543175



 98%|█████████▊| 1001/1024 [09:25<00:13,  1.72it/s][A
 98%|█████████▊| 1002/1024 [09:25<00:12,  1.71it/s][A
 98%|█████████▊| 1003/1024 [09:26<00:12,  1.72it/s][A
 98%|█████████▊| 1004/1024 [09:27<00:11,  1.72it/s][A
 98%|█████████▊| 1005/1024 [09:27<00:11,  1.72it/s][A
 98%|█████████▊| 1006/1024 [09:28<00:10,  1.73it/s][A
 98%|█████████▊| 1007/1024 [09:28<00:09,  1.73it/s][A
 98%|█████████▊| 1008/1024 [09:29<00:09,  1.72it/s][A
 99%|█████████▊| 1009/1024 [09:29<00:08,  1.72it/s][A
 99%|█████████▊| 1010/1024 [09:30<00:08,  1.73it/s][A
 99%|█████████▊| 1011/1024 [09:31<00:07,  1.73it/s][A
 99%|█████████▉| 1012/1024 [09:31<00:06,  1.73it/s][A
 99%|█████████▉| 1013/1024 [09:32<00:06,  1.73it/s][A
 99%|█████████▉| 1014/1024 [09:32<00:05,  1.72it/s][A
 99%|█████████▉| 1015/1024 [09:33<00:05,  1.73it/s][A
 99%|█████████▉| 1016/1024 [09:34<00:04,  1.72it/s][A
 99%|█████████▉| 1017/1024 [09:34<00:04,  1.72it/s][A
 99%|█████████▉| 1018/1024 [09:35<00:03,  1.72it/s][A
100%|████

epoch [2/5], loss:0.0355


 40%|████      | 2/5 [56:38<1:47:20, 2146.81s/it]
  0%|          | 0/1024 [00:00<?, ?it/s][A
  0%|          | 1/1024 [00:00<10:03,  1.69it/s][A
  0%|          | 2/1024 [00:01<10:05,  1.69it/s][A
  0%|          | 3/1024 [00:01<10:00,  1.70it/s][A
  0%|          | 4/1024 [00:02<09:56,  1.71it/s][A
  0%|          | 5/1024 [00:02<09:56,  1.71it/s][A
  1%|          | 6/1024 [00:03<09:56,  1.71it/s][A
  1%|          | 7/1024 [00:04<09:54,  1.71it/s][A
  1%|          | 8/1024 [00:04<09:53,  1.71it/s][A
  1%|          | 9/1024 [00:05<09:52,  1.71it/s][A
  1%|          | 10/1024 [00:05<09:53,  1.71it/s][A
  1%|          | 11/1024 [00:06<09:51,  1.71it/s][A
  1%|          | 12/1024 [00:07<09:48,  1.72it/s][A
  1%|▏         | 13/1024 [00:07<09:47,  1.72it/s][A
  1%|▏         | 14/1024 [00:08<09:48,  1.72it/s][A
  1%|▏         | 15/1024 [00:08<09:48,  1.71it/s][A
  2%|▏         | 16/1024 [00:09<09:46,  1.72it/s][A
  2%|▏         | 17/1024 [00:09<09:49,  1.71it/s][A
  2%|▏        

100/1024 iterations, loss:0.03346984088420868



 10%|▉         | 101/1024 [00:59<09:04,  1.70it/s][A
 10%|▉         | 102/1024 [00:59<08:59,  1.71it/s][A
 10%|█         | 103/1024 [01:00<08:56,  1.72it/s][A
 10%|█         | 104/1024 [01:00<08:54,  1.72it/s][A
 10%|█         | 105/1024 [01:01<08:52,  1.73it/s][A
 10%|█         | 106/1024 [01:01<08:53,  1.72it/s][A
 10%|█         | 107/1024 [01:02<08:54,  1.71it/s][A
 11%|█         | 108/1024 [01:03<08:54,  1.72it/s][A
 11%|█         | 109/1024 [01:03<08:51,  1.72it/s][A
 11%|█         | 110/1024 [01:04<08:54,  1.71it/s][A
 11%|█         | 111/1024 [01:04<08:53,  1.71it/s][A
 11%|█         | 112/1024 [01:05<08:54,  1.71it/s][A
 11%|█         | 113/1024 [01:06<08:54,  1.71it/s][A
 11%|█         | 114/1024 [01:06<08:52,  1.71it/s][A
 11%|█         | 115/1024 [01:07<08:51,  1.71it/s][A
 11%|█▏        | 116/1024 [01:07<08:49,  1.71it/s][A
 11%|█▏        | 117/1024 [01:08<08:48,  1.72it/s][A
 12%|█▏        | 118/1024 [01:08<08:49,  1.71it/s][A
 12%|█▏        | 119/1024 [

200/1024 iterations, loss:0.03411337360739708



 20%|█▉        | 201/1024 [01:57<07:59,  1.72it/s][A
 20%|█▉        | 202/1024 [01:57<07:59,  1.71it/s][A
 20%|█▉        | 203/1024 [01:58<07:56,  1.72it/s][A
 20%|█▉        | 204/1024 [01:59<07:55,  1.72it/s][A
 20%|██        | 205/1024 [01:59<07:55,  1.72it/s][A
 20%|██        | 206/1024 [02:00<07:56,  1.72it/s][A
 20%|██        | 207/1024 [02:00<07:57,  1.71it/s][A
 20%|██        | 208/1024 [02:01<07:55,  1.72it/s][A
 20%|██        | 209/1024 [02:01<07:53,  1.72it/s][A
 21%|██        | 210/1024 [02:02<07:52,  1.72it/s][A
 21%|██        | 211/1024 [02:03<07:51,  1.72it/s][A
 21%|██        | 212/1024 [02:03<07:50,  1.73it/s][A
 21%|██        | 213/1024 [02:04<07:51,  1.72it/s][A
 21%|██        | 214/1024 [02:04<07:52,  1.72it/s][A
 21%|██        | 215/1024 [02:05<07:50,  1.72it/s][A
 21%|██        | 216/1024 [02:06<07:51,  1.71it/s][A
 21%|██        | 217/1024 [02:06<07:48,  1.72it/s][A
 21%|██▏       | 218/1024 [02:07<07:47,  1.72it/s][A
 21%|██▏       | 219/1024 [

300/1024 iterations, loss:0.035671062767505646



 29%|██▉       | 301/1024 [02:55<07:00,  1.72it/s][A
 29%|██▉       | 302/1024 [02:56<07:00,  1.72it/s][A
 30%|██▉       | 303/1024 [02:56<07:00,  1.71it/s][A
 30%|██▉       | 304/1024 [02:57<06:58,  1.72it/s][A
 30%|██▉       | 305/1024 [02:57<06:59,  1.71it/s][A
 30%|██▉       | 306/1024 [02:58<06:58,  1.72it/s][A
 30%|██▉       | 307/1024 [02:59<06:59,  1.71it/s][A
 30%|███       | 308/1024 [02:59<06:59,  1.71it/s][A
 30%|███       | 309/1024 [03:00<06:58,  1.71it/s][A
 30%|███       | 310/1024 [03:00<06:56,  1.71it/s][A
 30%|███       | 311/1024 [03:01<06:55,  1.72it/s][A
 30%|███       | 312/1024 [03:01<06:54,  1.72it/s][A
 31%|███       | 313/1024 [03:02<06:52,  1.73it/s][A
 31%|███       | 314/1024 [03:03<06:52,  1.72it/s][A
 31%|███       | 315/1024 [03:03<06:51,  1.72it/s][A
 31%|███       | 316/1024 [03:04<06:52,  1.72it/s][A
 31%|███       | 317/1024 [03:04<06:52,  1.71it/s][A
 31%|███       | 318/1024 [03:05<06:50,  1.72it/s][A
 31%|███       | 319/1024 [

400/1024 iterations, loss:0.039356131106615067



 39%|███▉      | 401/1024 [03:53<06:04,  1.71it/s][A
 39%|███▉      | 402/1024 [03:54<06:02,  1.71it/s][A
 39%|███▉      | 403/1024 [03:54<06:01,  1.72it/s][A
 39%|███▉      | 404/1024 [03:55<05:59,  1.72it/s][A
 40%|███▉      | 405/1024 [03:56<05:58,  1.73it/s][A
 40%|███▉      | 406/1024 [03:56<05:58,  1.73it/s][A
 40%|███▉      | 407/1024 [03:57<05:57,  1.73it/s][A
 40%|███▉      | 408/1024 [03:57<05:57,  1.72it/s][A
 40%|███▉      | 409/1024 [03:58<05:56,  1.72it/s][A
 40%|████      | 410/1024 [03:59<05:58,  1.71it/s][A
 40%|████      | 411/1024 [03:59<05:56,  1.72it/s][A
 40%|████      | 412/1024 [04:00<05:56,  1.72it/s][A
 40%|████      | 413/1024 [04:00<05:55,  1.72it/s][A
 40%|████      | 414/1024 [04:01<05:54,  1.72it/s][A
 41%|████      | 415/1024 [04:01<05:53,  1.72it/s][A
 41%|████      | 416/1024 [04:02<05:52,  1.73it/s][A
 41%|████      | 417/1024 [04:03<05:52,  1.72it/s][A
 41%|████      | 418/1024 [04:03<05:52,  1.72it/s][A
 41%|████      | 419/1024 [

500/1024 iterations, loss:0.033845074474811554



 49%|████▉     | 501/1024 [04:52<05:06,  1.71it/s][A
 49%|████▉     | 502/1024 [04:52<05:04,  1.71it/s][A
 49%|████▉     | 503/1024 [04:53<05:03,  1.71it/s][A
 49%|████▉     | 504/1024 [04:53<05:02,  1.72it/s][A
 49%|████▉     | 505/1024 [04:54<05:03,  1.71it/s][A
 49%|████▉     | 506/1024 [04:54<05:03,  1.71it/s][A
 50%|████▉     | 507/1024 [04:55<05:02,  1.71it/s][A
 50%|████▉     | 508/1024 [04:56<05:01,  1.71it/s][A
 50%|████▉     | 509/1024 [04:56<05:00,  1.71it/s][A
 50%|████▉     | 510/1024 [04:57<04:59,  1.72it/s][A
 50%|████▉     | 511/1024 [04:57<04:58,  1.72it/s][A
 50%|█████     | 512/1024 [04:58<04:58,  1.71it/s][A
 50%|█████     | 513/1024 [04:59<04:57,  1.72it/s][A
 50%|█████     | 514/1024 [04:59<04:57,  1.71it/s][A
 50%|█████     | 515/1024 [05:00<04:56,  1.72it/s][A
 50%|█████     | 516/1024 [05:00<04:56,  1.71it/s][A
 50%|█████     | 517/1024 [05:01<04:54,  1.72it/s][A
 51%|█████     | 518/1024 [05:01<04:54,  1.72it/s][A
 51%|█████     | 519/1024 [

600/1024 iterations, loss:0.0353609137237072



 59%|█████▊    | 601/1024 [05:50<04:07,  1.71it/s][A
 59%|█████▉    | 602/1024 [05:50<04:06,  1.71it/s][A
 59%|█████▉    | 603/1024 [05:51<04:05,  1.71it/s][A
 59%|█████▉    | 604/1024 [05:52<04:04,  1.72it/s][A
 59%|█████▉    | 605/1024 [05:52<04:03,  1.72it/s][A
 59%|█████▉    | 606/1024 [05:53<04:03,  1.72it/s][A
 59%|█████▉    | 607/1024 [05:53<04:02,  1.72it/s][A
 59%|█████▉    | 608/1024 [05:54<04:01,  1.72it/s][A
 59%|█████▉    | 609/1024 [05:55<04:00,  1.72it/s][A
 60%|█████▉    | 610/1024 [05:55<04:00,  1.72it/s][A
 60%|█████▉    | 611/1024 [05:56<03:59,  1.73it/s][A
 60%|█████▉    | 612/1024 [05:56<03:58,  1.73it/s][A
 60%|█████▉    | 613/1024 [05:57<03:58,  1.72it/s][A
 60%|█████▉    | 614/1024 [05:57<03:58,  1.72it/s][A
 60%|██████    | 615/1024 [05:58<03:57,  1.72it/s][A
 60%|██████    | 616/1024 [05:59<03:56,  1.72it/s][A
 60%|██████    | 617/1024 [05:59<03:55,  1.73it/s][A
 60%|██████    | 618/1024 [06:00<03:55,  1.72it/s][A
 60%|██████    | 619/1024 [

700/1024 iterations, loss:0.03268197551369667



 68%|██████▊   | 701/1024 [06:48<03:08,  1.71it/s][A
 69%|██████▊   | 702/1024 [06:49<03:07,  1.71it/s][A
 69%|██████▊   | 703/1024 [06:49<03:07,  1.71it/s][A
 69%|██████▉   | 704/1024 [06:50<03:06,  1.72it/s][A
 69%|██████▉   | 705/1024 [06:50<03:05,  1.72it/s][A
 69%|██████▉   | 706/1024 [06:51<03:05,  1.72it/s][A
 69%|██████▉   | 707/1024 [06:52<03:04,  1.72it/s][A
 69%|██████▉   | 708/1024 [06:52<03:03,  1.72it/s][A
 69%|██████▉   | 709/1024 [06:53<03:03,  1.71it/s][A
 69%|██████▉   | 710/1024 [06:53<03:03,  1.71it/s][A
 69%|██████▉   | 711/1024 [06:54<03:01,  1.72it/s][A
 70%|██████▉   | 712/1024 [06:54<03:02,  1.71it/s][A
 70%|██████▉   | 713/1024 [06:55<03:00,  1.72it/s][A
 70%|██████▉   | 714/1024 [06:56<02:59,  1.72it/s][A
 70%|██████▉   | 715/1024 [06:56<02:58,  1.73it/s][A
 70%|██████▉   | 716/1024 [06:57<02:58,  1.73it/s][A
 70%|███████   | 717/1024 [06:57<02:57,  1.73it/s][A
 70%|███████   | 718/1024 [06:58<02:56,  1.73it/s][A
 70%|███████   | 719/1024 [

800/1024 iterations, loss:0.03164006397128105



 78%|███████▊  | 801/1024 [07:46<02:09,  1.72it/s][A
 78%|███████▊  | 802/1024 [07:47<02:08,  1.72it/s][A
 78%|███████▊  | 803/1024 [07:47<02:08,  1.73it/s][A
 79%|███████▊  | 804/1024 [07:48<02:07,  1.72it/s][A
 79%|███████▊  | 805/1024 [07:49<02:07,  1.72it/s][A
 79%|███████▊  | 806/1024 [07:49<02:06,  1.73it/s][A
 79%|███████▉  | 807/1024 [07:50<02:05,  1.73it/s][A
 79%|███████▉  | 808/1024 [07:50<02:05,  1.73it/s][A
 79%|███████▉  | 809/1024 [07:51<02:04,  1.73it/s][A
 79%|███████▉  | 810/1024 [07:52<02:04,  1.72it/s][A
 79%|███████▉  | 811/1024 [07:52<02:03,  1.72it/s][A
 79%|███████▉  | 812/1024 [07:53<02:03,  1.72it/s][A
 79%|███████▉  | 813/1024 [07:53<02:02,  1.72it/s][A
 79%|███████▉  | 814/1024 [07:54<02:01,  1.73it/s][A
 80%|███████▉  | 815/1024 [07:54<02:01,  1.72it/s][A
 80%|███████▉  | 816/1024 [07:55<02:01,  1.72it/s][A
 80%|███████▉  | 817/1024 [07:56<02:00,  1.72it/s][A
 80%|███████▉  | 818/1024 [07:56<01:59,  1.72it/s][A
 80%|███████▉  | 819/1024 [

900/1024 iterations, loss:0.03398633003234863



 88%|████████▊ | 901/1024 [08:44<01:12,  1.70it/s][A
 88%|████████▊ | 902/1024 [08:45<01:11,  1.70it/s][A
 88%|████████▊ | 903/1024 [08:46<01:10,  1.70it/s][A
 88%|████████▊ | 904/1024 [08:46<01:10,  1.71it/s][A
 88%|████████▊ | 905/1024 [08:47<01:09,  1.71it/s][A
 88%|████████▊ | 906/1024 [08:47<01:08,  1.72it/s][A
 89%|████████▊ | 907/1024 [08:48<01:08,  1.72it/s][A
 89%|████████▊ | 908/1024 [08:49<01:07,  1.72it/s][A
 89%|████████▉ | 909/1024 [08:49<01:06,  1.72it/s][A
 89%|████████▉ | 910/1024 [08:50<01:05,  1.73it/s][A
 89%|████████▉ | 911/1024 [08:50<01:05,  1.72it/s][A
 89%|████████▉ | 912/1024 [08:51<01:04,  1.73it/s][A
 89%|████████▉ | 913/1024 [08:51<01:04,  1.73it/s][A
 89%|████████▉ | 914/1024 [08:52<01:03,  1.73it/s][A
 89%|████████▉ | 915/1024 [08:53<01:02,  1.73it/s][A
 89%|████████▉ | 916/1024 [08:53<01:02,  1.73it/s][A
 90%|████████▉ | 917/1024 [08:54<01:01,  1.73it/s][A
 90%|████████▉ | 918/1024 [08:54<01:01,  1.73it/s][A
 90%|████████▉ | 919/1024 [

1000/1024 iterations, loss:0.03351990133523941



 98%|█████████▊| 1001/1024 [09:43<00:13,  1.71it/s][A
 98%|█████████▊| 1002/1024 [09:43<00:12,  1.72it/s][A
 98%|█████████▊| 1003/1024 [09:44<00:12,  1.72it/s][A
 98%|█████████▊| 1004/1024 [09:44<00:11,  1.72it/s][A
 98%|█████████▊| 1005/1024 [09:45<00:11,  1.72it/s][A
 98%|█████████▊| 1006/1024 [09:46<00:10,  1.72it/s][A
 98%|█████████▊| 1007/1024 [09:46<00:09,  1.72it/s][A
 98%|█████████▊| 1008/1024 [09:47<00:09,  1.72it/s][A
 99%|█████████▊| 1009/1024 [09:47<00:08,  1.72it/s][A
 99%|█████████▊| 1010/1024 [09:48<00:08,  1.72it/s][A
 99%|█████████▊| 1011/1024 [09:48<00:07,  1.72it/s][A
 99%|█████████▉| 1012/1024 [09:49<00:06,  1.73it/s][A
 99%|█████████▉| 1013/1024 [09:50<00:06,  1.72it/s][A
 99%|█████████▉| 1014/1024 [09:50<00:05,  1.73it/s][A
 99%|█████████▉| 1015/1024 [09:51<00:05,  1.73it/s][A
 99%|█████████▉| 1016/1024 [09:51<00:04,  1.73it/s][A
 99%|█████████▉| 1017/1024 [09:52<00:04,  1.72it/s][A
 99%|█████████▉| 1018/1024 [09:52<00:03,  1.72it/s][A
100%|████

epoch [3/5], loss:0.0338


 60%|██████    | 3/5 [1:06:35<56:04, 1682.08s/it]
  0%|          | 0/1024 [00:00<?, ?it/s][A
  0%|          | 1/1024 [00:00<10:00,  1.70it/s][A
  0%|          | 2/1024 [00:01<09:57,  1.71it/s][A
  0%|          | 3/1024 [00:01<09:53,  1.72it/s][A
  0%|          | 4/1024 [00:02<09:55,  1.71it/s][A
  0%|          | 5/1024 [00:02<09:51,  1.72it/s][A
  1%|          | 6/1024 [00:03<09:50,  1.72it/s][A
  1%|          | 7/1024 [00:04<09:49,  1.73it/s][A
  1%|          | 8/1024 [00:04<09:46,  1.73it/s][A
  1%|          | 9/1024 [00:05<09:45,  1.73it/s][A
  1%|          | 10/1024 [00:05<09:46,  1.73it/s][A
  1%|          | 11/1024 [00:06<09:47,  1.72it/s][A
  1%|          | 12/1024 [00:06<09:45,  1.73it/s][A
  1%|▏         | 13/1024 [00:07<09:44,  1.73it/s][A
  1%|▏         | 14/1024 [00:08<09:44,  1.73it/s][A
  1%|▏         | 15/1024 [00:08<09:42,  1.73it/s][A
  2%|▏         | 16/1024 [00:09<09:43,  1.73it/s][A
  2%|▏         | 17/1024 [00:09<09:43,  1.73it/s][A
  2%|▏        

100/1024 iterations, loss:0.03151093050837517



 10%|▉         | 101/1024 [00:58<08:58,  1.71it/s][A
 10%|▉         | 102/1024 [00:59<08:55,  1.72it/s][A
 10%|█         | 103/1024 [00:59<08:54,  1.72it/s][A
 10%|█         | 104/1024 [01:00<08:55,  1.72it/s][A
 10%|█         | 105/1024 [01:01<08:52,  1.73it/s][A
 10%|█         | 106/1024 [01:01<08:51,  1.73it/s][A
 10%|█         | 107/1024 [01:02<08:51,  1.72it/s][A
 11%|█         | 108/1024 [01:02<08:50,  1.73it/s][A
 11%|█         | 109/1024 [01:03<08:51,  1.72it/s][A
 11%|█         | 110/1024 [01:04<08:49,  1.72it/s][A
 11%|█         | 111/1024 [01:04<08:50,  1.72it/s][A
 11%|█         | 112/1024 [01:05<08:52,  1.71it/s][A
 11%|█         | 113/1024 [01:05<08:51,  1.72it/s][A
 11%|█         | 114/1024 [01:06<08:52,  1.71it/s][A
 11%|█         | 115/1024 [01:06<08:50,  1.71it/s][A
 11%|█▏        | 116/1024 [01:07<08:50,  1.71it/s][A
 11%|█▏        | 117/1024 [01:08<08:49,  1.71it/s][A
 12%|█▏        | 118/1024 [01:08<08:49,  1.71it/s][A
 12%|█▏        | 119/1024 [

200/1024 iterations, loss:0.03233261778950691



 20%|█▉        | 201/1024 [01:57<07:59,  1.71it/s][A
 20%|█▉        | 202/1024 [01:57<07:58,  1.72it/s][A
 20%|█▉        | 203/1024 [01:58<07:56,  1.72it/s][A
 20%|█▉        | 204/1024 [01:58<07:54,  1.73it/s][A
 20%|██        | 205/1024 [01:59<07:53,  1.73it/s][A
 20%|██        | 206/1024 [01:59<07:54,  1.72it/s][A
 20%|██        | 207/1024 [02:00<07:54,  1.72it/s][A
 20%|██        | 208/1024 [02:01<07:53,  1.72it/s][A
 20%|██        | 209/1024 [02:01<07:51,  1.73it/s][A
 21%|██        | 210/1024 [02:02<07:53,  1.72it/s][A
 21%|██        | 211/1024 [02:02<07:53,  1.72it/s][A
 21%|██        | 212/1024 [02:03<07:52,  1.72it/s][A
 21%|██        | 213/1024 [02:03<07:52,  1.71it/s][A
 21%|██        | 214/1024 [02:04<07:53,  1.71it/s][A
 21%|██        | 215/1024 [02:05<07:51,  1.72it/s][A
 21%|██        | 216/1024 [02:05<07:56,  1.70it/s][A
 21%|██        | 217/1024 [02:06<07:53,  1.70it/s][A
 21%|██▏       | 218/1024 [02:06<07:51,  1.71it/s][A
 21%|██▏       | 219/1024 [

300/1024 iterations, loss:0.033534418791532516



 29%|██▉       | 301/1024 [02:55<06:59,  1.72it/s][A
 29%|██▉       | 302/1024 [02:55<06:58,  1.72it/s][A
 30%|██▉       | 303/1024 [02:56<06:58,  1.72it/s][A
 30%|██▉       | 304/1024 [02:57<06:58,  1.72it/s][A
 30%|██▉       | 305/1024 [02:57<06:57,  1.72it/s][A
 30%|██▉       | 306/1024 [02:58<06:56,  1.73it/s][A
 30%|██▉       | 307/1024 [02:58<06:56,  1.72it/s][A
 30%|███       | 308/1024 [02:59<06:56,  1.72it/s][A
 30%|███       | 309/1024 [02:59<06:55,  1.72it/s][A
 30%|███       | 310/1024 [03:00<06:57,  1.71it/s][A
 30%|███       | 311/1024 [03:01<06:55,  1.71it/s][A
 30%|███       | 312/1024 [03:01<06:55,  1.71it/s][A
 31%|███       | 313/1024 [03:02<06:58,  1.70it/s][A
 31%|███       | 314/1024 [03:02<06:55,  1.71it/s][A
 31%|███       | 315/1024 [03:03<06:54,  1.71it/s][A
 31%|███       | 316/1024 [03:04<06:53,  1.71it/s][A
 31%|███       | 317/1024 [03:04<06:52,  1.71it/s][A
 31%|███       | 318/1024 [03:05<06:50,  1.72it/s][A
 31%|███       | 319/1024 [

400/1024 iterations, loss:0.031804803758859634



 39%|███▉      | 401/1024 [03:53<06:03,  1.71it/s][A
 39%|███▉      | 402/1024 [03:54<06:01,  1.72it/s][A
 39%|███▉      | 403/1024 [03:54<06:00,  1.72it/s][A
 39%|███▉      | 404/1024 [03:55<05:59,  1.73it/s][A
 40%|███▉      | 405/1024 [03:55<05:58,  1.73it/s][A
 40%|███▉      | 406/1024 [03:56<05:59,  1.72it/s][A
 40%|███▉      | 407/1024 [03:57<05:58,  1.72it/s][A
 40%|███▉      | 408/1024 [03:57<05:56,  1.73it/s][A
 40%|███▉      | 409/1024 [03:58<05:57,  1.72it/s][A
 40%|████      | 410/1024 [03:58<05:56,  1.72it/s][A
 40%|████      | 411/1024 [03:59<05:56,  1.72it/s][A
 40%|████      | 412/1024 [04:00<05:56,  1.72it/s][A
 40%|████      | 413/1024 [04:00<05:55,  1.72it/s][A
 40%|████      | 414/1024 [04:01<05:54,  1.72it/s][A
 41%|████      | 415/1024 [04:01<05:52,  1.73it/s][A
 41%|████      | 416/1024 [04:02<05:52,  1.72it/s][A
 41%|████      | 417/1024 [04:02<05:51,  1.73it/s][A
 41%|████      | 418/1024 [04:03<05:50,  1.73it/s][A
 41%|████      | 419/1024 [

500/1024 iterations, loss:0.11459923535585403



 49%|████▉     | 501/1024 [04:51<05:01,  1.73it/s][A
 49%|████▉     | 502/1024 [04:52<05:00,  1.74it/s][A
 49%|████▉     | 503/1024 [04:52<04:59,  1.74it/s][A
 49%|████▉     | 504/1024 [04:53<05:00,  1.73it/s][A
 49%|████▉     | 505/1024 [04:54<04:59,  1.73it/s][A
 49%|████▉     | 506/1024 [04:54<04:59,  1.73it/s][A
 50%|████▉     | 507/1024 [04:55<04:59,  1.73it/s][A
 50%|████▉     | 508/1024 [04:55<04:58,  1.73it/s][A
 50%|████▉     | 509/1024 [04:56<04:57,  1.73it/s][A
 50%|████▉     | 510/1024 [04:56<04:57,  1.73it/s][A
 50%|████▉     | 511/1024 [04:57<04:56,  1.73it/s][A
 50%|█████     | 512/1024 [04:58<04:55,  1.73it/s][A
 50%|█████     | 513/1024 [04:58<04:54,  1.74it/s][A
 50%|█████     | 514/1024 [04:59<04:54,  1.73it/s][A
 50%|█████     | 515/1024 [04:59<04:54,  1.73it/s][A
 50%|█████     | 516/1024 [05:00<04:55,  1.72it/s][A
 50%|█████     | 517/1024 [05:00<04:53,  1.73it/s][A
 51%|█████     | 518/1024 [05:01<04:54,  1.72it/s][A
 51%|█████     | 519/1024 [

600/1024 iterations, loss:0.03174511715769768



 59%|█████▊    | 601/1024 [05:49<04:05,  1.73it/s][A
 59%|█████▉    | 602/1024 [05:50<04:04,  1.72it/s][A
 59%|█████▉    | 603/1024 [05:51<04:04,  1.72it/s][A
 59%|█████▉    | 604/1024 [05:51<04:04,  1.72it/s][A
 59%|█████▉    | 605/1024 [05:52<04:03,  1.72it/s][A
 59%|█████▉    | 606/1024 [05:52<04:02,  1.73it/s][A
 59%|█████▉    | 607/1024 [05:53<04:02,  1.72it/s][A
 59%|█████▉    | 608/1024 [05:53<04:01,  1.73it/s][A
 59%|█████▉    | 609/1024 [05:54<04:00,  1.73it/s][A
 60%|█████▉    | 610/1024 [05:55<03:59,  1.73it/s][A
 60%|█████▉    | 611/1024 [05:55<03:59,  1.72it/s][A
 60%|█████▉    | 612/1024 [05:56<03:59,  1.72it/s][A
 60%|█████▉    | 613/1024 [05:56<03:58,  1.73it/s][A
 60%|█████▉    | 614/1024 [05:57<03:58,  1.72it/s][A
 60%|██████    | 615/1024 [05:57<03:58,  1.72it/s][A
 60%|██████    | 616/1024 [05:58<03:56,  1.72it/s][A
 60%|██████    | 617/1024 [05:59<03:56,  1.72it/s][A
 60%|██████    | 618/1024 [05:59<03:55,  1.72it/s][A
 60%|██████    | 619/1024 [

700/1024 iterations, loss:0.030976759269833565



 68%|██████▊   | 701/1024 [06:48<03:06,  1.73it/s][A
 69%|██████▊   | 702/1024 [06:48<03:06,  1.73it/s][A
 69%|██████▊   | 703/1024 [06:49<03:05,  1.73it/s][A
 69%|██████▉   | 704/1024 [06:49<03:04,  1.73it/s][A
 69%|██████▉   | 705/1024 [06:50<03:04,  1.73it/s][A
 69%|██████▉   | 706/1024 [06:50<03:05,  1.72it/s][A
 69%|██████▉   | 707/1024 [06:51<03:04,  1.72it/s][A
 69%|██████▉   | 708/1024 [06:52<03:04,  1.71it/s][A
 69%|██████▉   | 709/1024 [06:52<03:03,  1.72it/s][A
 69%|██████▉   | 710/1024 [06:53<03:02,  1.72it/s][A
 69%|██████▉   | 711/1024 [06:53<03:01,  1.72it/s][A
 70%|██████▉   | 712/1024 [06:54<03:01,  1.72it/s][A
 70%|██████▉   | 713/1024 [06:54<03:00,  1.72it/s][A
 70%|██████▉   | 714/1024 [06:55<02:59,  1.73it/s][A
 70%|██████▉   | 715/1024 [06:56<02:59,  1.73it/s][A
 70%|██████▉   | 716/1024 [06:56<02:58,  1.73it/s][A
 70%|███████   | 717/1024 [06:57<02:57,  1.73it/s][A
 70%|███████   | 718/1024 [06:57<02:56,  1.73it/s][A
 70%|███████   | 719/1024 [

800/1024 iterations, loss:0.04449846222996712



 78%|███████▊  | 801/1024 [07:46<02:10,  1.71it/s][A
 78%|███████▊  | 802/1024 [07:46<02:09,  1.71it/s][A
 78%|███████▊  | 803/1024 [07:47<02:08,  1.72it/s][A
 79%|███████▊  | 804/1024 [07:47<02:07,  1.72it/s][A
 79%|███████▊  | 805/1024 [07:48<02:07,  1.72it/s][A
 79%|███████▊  | 806/1024 [07:49<02:06,  1.72it/s][A
 79%|███████▉  | 807/1024 [07:49<02:06,  1.72it/s][A
 79%|███████▉  | 808/1024 [07:50<02:05,  1.72it/s][A
 79%|███████▉  | 809/1024 [07:50<02:04,  1.72it/s][A
 79%|███████▉  | 810/1024 [07:51<02:04,  1.72it/s][A
 79%|███████▉  | 811/1024 [07:51<02:03,  1.72it/s][A
 79%|███████▉  | 812/1024 [07:52<02:02,  1.72it/s][A
 79%|███████▉  | 813/1024 [07:53<02:02,  1.72it/s][A
 79%|███████▉  | 814/1024 [07:53<02:02,  1.71it/s][A
 80%|███████▉  | 815/1024 [07:54<02:01,  1.71it/s][A
 80%|███████▉  | 816/1024 [07:54<02:01,  1.71it/s][A
 80%|███████▉  | 817/1024 [07:55<02:00,  1.71it/s][A
 80%|███████▉  | 818/1024 [07:56<02:00,  1.71it/s][A
 80%|███████▉  | 819/1024 [

900/1024 iterations, loss:0.031779829412698746



 88%|████████▊ | 901/1024 [08:44<01:13,  1.68it/s][A
 88%|████████▊ | 902/1024 [08:45<01:11,  1.69it/s][A
 88%|████████▊ | 903/1024 [08:45<01:10,  1.70it/s][A
 88%|████████▊ | 904/1024 [08:46<01:09,  1.72it/s][A
 88%|████████▊ | 905/1024 [08:46<01:09,  1.72it/s][A
 88%|████████▊ | 906/1024 [08:47<01:08,  1.72it/s][A
 89%|████████▊ | 907/1024 [08:47<01:07,  1.73it/s][A
 89%|████████▊ | 908/1024 [08:48<01:07,  1.73it/s][A
 89%|████████▉ | 909/1024 [08:49<01:06,  1.72it/s][A
 89%|████████▉ | 910/1024 [08:49<01:06,  1.72it/s][A
 89%|████████▉ | 911/1024 [08:50<01:05,  1.72it/s][A
 89%|████████▉ | 912/1024 [08:50<01:04,  1.72it/s][A
 89%|████████▉ | 913/1024 [08:51<01:04,  1.73it/s][A
 89%|████████▉ | 914/1024 [08:52<01:03,  1.72it/s][A
 89%|████████▉ | 915/1024 [08:52<01:03,  1.73it/s][A
 89%|████████▉ | 916/1024 [08:53<01:02,  1.72it/s][A
 90%|████████▉ | 917/1024 [08:53<01:02,  1.72it/s][A
 90%|████████▉ | 918/1024 [08:54<01:01,  1.72it/s][A
 90%|████████▉ | 919/1024 [

1000/1024 iterations, loss:0.03156517446041107



 98%|█████████▊| 1001/1024 [09:42<00:13,  1.70it/s][A
 98%|█████████▊| 1002/1024 [09:43<00:12,  1.71it/s][A
 98%|█████████▊| 1003/1024 [09:43<00:12,  1.70it/s][A
 98%|█████████▊| 1004/1024 [09:44<00:11,  1.70it/s][A
 98%|█████████▊| 1005/1024 [09:45<00:11,  1.71it/s][A
 98%|█████████▊| 1006/1024 [09:45<00:10,  1.72it/s][A
 98%|█████████▊| 1007/1024 [09:46<00:09,  1.72it/s][A
 98%|█████████▊| 1008/1024 [09:46<00:09,  1.71it/s][A
 99%|█████████▊| 1009/1024 [09:47<00:08,  1.72it/s][A
 99%|█████████▊| 1010/1024 [09:48<00:08,  1.72it/s][A
 99%|█████████▊| 1011/1024 [09:48<00:07,  1.72it/s][A
 99%|█████████▉| 1012/1024 [09:49<00:06,  1.72it/s][A
 99%|█████████▉| 1013/1024 [09:49<00:06,  1.72it/s][A
 99%|█████████▉| 1014/1024 [09:50<00:05,  1.72it/s][A
 99%|█████████▉| 1015/1024 [09:50<00:05,  1.72it/s][A
 99%|█████████▉| 1016/1024 [09:51<00:04,  1.73it/s][A
 99%|█████████▉| 1017/1024 [09:52<00:04,  1.73it/s][A
 99%|█████████▉| 1018/1024 [09:52<00:03,  1.73it/s][A
100%|████

epoch [4/5], loss:0.0292


 80%|████████  | 4/5 [1:16:33<22:36, 1356.70s/it]
  0%|          | 0/1024 [00:00<?, ?it/s][A
  0%|          | 1/1024 [00:00<09:50,  1.73it/s][A
  0%|          | 2/1024 [00:01<09:49,  1.73it/s][A
  0%|          | 3/1024 [00:01<09:50,  1.73it/s][A
  0%|          | 4/1024 [00:02<09:49,  1.73it/s][A
  0%|          | 5/1024 [00:02<09:54,  1.71it/s][A
  1%|          | 6/1024 [00:03<09:53,  1.71it/s][A
  1%|          | 7/1024 [00:04<09:53,  1.71it/s][A
  1%|          | 8/1024 [00:04<09:50,  1.72it/s][A
  1%|          | 9/1024 [00:05<09:49,  1.72it/s][A
  1%|          | 10/1024 [00:05<09:52,  1.71it/s][A
  1%|          | 11/1024 [00:06<09:50,  1.72it/s][A
  1%|          | 12/1024 [00:06<09:47,  1.72it/s][A
  1%|▏         | 13/1024 [00:07<09:46,  1.72it/s][A
  1%|▏         | 14/1024 [00:08<09:49,  1.71it/s][A
  1%|▏         | 15/1024 [00:08<09:49,  1.71it/s][A
  2%|▏         | 16/1024 [00:09<09:46,  1.72it/s][A
  2%|▏         | 17/1024 [00:09<09:48,  1.71it/s][A
  2%|▏        

100/1024 iterations, loss:0.030146436765789986



 10%|▉         | 101/1024 [00:58<08:59,  1.71it/s][A
 10%|▉         | 102/1024 [00:59<08:57,  1.72it/s][A
 10%|█         | 103/1024 [01:00<08:58,  1.71it/s][A
 10%|█         | 104/1024 [01:00<08:55,  1.72it/s][A
 10%|█         | 105/1024 [01:01<08:55,  1.72it/s][A
 10%|█         | 106/1024 [01:01<08:54,  1.72it/s][A
 10%|█         | 107/1024 [01:02<08:55,  1.71it/s][A
 11%|█         | 108/1024 [01:02<08:57,  1.70it/s][A
 11%|█         | 109/1024 [01:03<08:57,  1.70it/s][A
 11%|█         | 110/1024 [01:04<08:56,  1.70it/s][A
 11%|█         | 111/1024 [01:04<08:53,  1.71it/s][A
 11%|█         | 112/1024 [01:05<08:49,  1.72it/s][A
 11%|█         | 113/1024 [01:05<08:50,  1.72it/s][A
 11%|█         | 114/1024 [01:06<08:48,  1.72it/s][A
 11%|█         | 115/1024 [01:07<08:46,  1.73it/s][A
 11%|█▏        | 116/1024 [01:07<08:43,  1.73it/s][A
 11%|█▏        | 117/1024 [01:08<08:47,  1.72it/s][A
 12%|█▏        | 118/1024 [01:08<08:50,  1.71it/s][A
 12%|█▏        | 119/1024 [

200/1024 iterations, loss:0.0597948394715786



 20%|█▉        | 201/1024 [01:57<07:58,  1.72it/s][A
 20%|█▉        | 202/1024 [01:57<07:58,  1.72it/s][A
 20%|█▉        | 203/1024 [01:58<07:57,  1.72it/s][A
 20%|█▉        | 204/1024 [01:58<07:55,  1.73it/s][A
 20%|██        | 205/1024 [01:59<07:55,  1.72it/s][A
 20%|██        | 206/1024 [01:59<07:56,  1.72it/s][A
 20%|██        | 207/1024 [02:00<07:55,  1.72it/s][A
 20%|██        | 208/1024 [02:01<07:53,  1.72it/s][A
 20%|██        | 209/1024 [02:01<07:52,  1.73it/s][A
 21%|██        | 210/1024 [02:02<07:51,  1.72it/s][A
 21%|██        | 211/1024 [02:02<07:53,  1.72it/s][A
 21%|██        | 212/1024 [02:03<07:53,  1.71it/s][A
 21%|██        | 213/1024 [02:04<07:54,  1.71it/s][A
 21%|██        | 214/1024 [02:04<07:52,  1.72it/s][A
 21%|██        | 215/1024 [02:05<07:50,  1.72it/s][A
 21%|██        | 216/1024 [02:05<07:49,  1.72it/s][A
 21%|██        | 217/1024 [02:06<07:48,  1.72it/s][A
 21%|██▏       | 218/1024 [02:06<07:49,  1.72it/s][A
 21%|██▏       | 219/1024 [

300/1024 iterations, loss:0.06073842942714691



 29%|██▉       | 301/1024 [02:55<07:01,  1.72it/s][A
 29%|██▉       | 302/1024 [02:55<07:01,  1.71it/s][A
 30%|██▉       | 303/1024 [02:56<06:59,  1.72it/s][A
 30%|██▉       | 304/1024 [02:57<06:57,  1.73it/s][A
 30%|██▉       | 305/1024 [02:57<06:56,  1.73it/s][A
 30%|██▉       | 306/1024 [02:58<06:54,  1.73it/s][A
 30%|██▉       | 307/1024 [02:58<06:54,  1.73it/s][A
 30%|███       | 308/1024 [02:59<06:54,  1.73it/s][A
 30%|███       | 309/1024 [03:00<06:56,  1.71it/s][A
 30%|███       | 310/1024 [03:00<06:56,  1.71it/s][A
 30%|███       | 311/1024 [03:01<06:54,  1.72it/s][A
 30%|███       | 312/1024 [03:01<06:53,  1.72it/s][A
 31%|███       | 313/1024 [03:02<06:51,  1.73it/s][A
 31%|███       | 314/1024 [03:02<06:55,  1.71it/s][A
 31%|███       | 315/1024 [03:03<06:54,  1.71it/s][A
 31%|███       | 316/1024 [03:04<06:53,  1.71it/s][A
 31%|███       | 317/1024 [03:04<06:53,  1.71it/s][A
 31%|███       | 318/1024 [03:05<06:52,  1.71it/s][A
 31%|███       | 319/1024 [

400/1024 iterations, loss:0.03477787598967552



 39%|███▉      | 401/1024 [03:53<06:03,  1.71it/s][A
 39%|███▉      | 402/1024 [03:54<06:03,  1.71it/s][A
 39%|███▉      | 403/1024 [03:54<06:02,  1.71it/s][A
 39%|███▉      | 404/1024 [03:55<06:00,  1.72it/s][A
 40%|███▉      | 405/1024 [03:56<06:00,  1.72it/s][A
 40%|███▉      | 406/1024 [03:56<05:59,  1.72it/s][A
 40%|███▉      | 407/1024 [03:57<05:58,  1.72it/s][A
 40%|███▉      | 408/1024 [03:57<05:57,  1.72it/s][A
 40%|███▉      | 409/1024 [03:58<05:56,  1.72it/s][A
 40%|████      | 410/1024 [03:58<05:56,  1.72it/s][A
 40%|████      | 411/1024 [03:59<05:55,  1.72it/s][A
 40%|████      | 412/1024 [04:00<05:56,  1.72it/s][A
 40%|████      | 413/1024 [04:00<05:54,  1.72it/s][A
 40%|████      | 414/1024 [04:01<05:54,  1.72it/s][A
 41%|████      | 415/1024 [04:01<05:54,  1.72it/s][A
 41%|████      | 416/1024 [04:02<05:54,  1.71it/s][A
 41%|████      | 417/1024 [04:03<05:58,  1.69it/s][A
 41%|████      | 418/1024 [04:03<05:56,  1.70it/s][A
 41%|████      | 419/1024 [

500/1024 iterations, loss:0.044843196868896484



 49%|████▉     | 501/1024 [04:52<05:05,  1.71it/s][A
 49%|████▉     | 502/1024 [04:52<05:03,  1.72it/s][A
 49%|████▉     | 503/1024 [04:53<05:03,  1.72it/s][A
 49%|████▉     | 504/1024 [04:54<05:03,  1.71it/s][A
 49%|████▉     | 505/1024 [04:54<05:05,  1.70it/s][A
 49%|████▉     | 506/1024 [04:55<05:03,  1.71it/s][A
 50%|████▉     | 507/1024 [04:55<05:01,  1.71it/s][A
 50%|████▉     | 508/1024 [04:56<05:01,  1.71it/s][A
 50%|████▉     | 509/1024 [04:57<05:01,  1.71it/s][A
 50%|████▉     | 510/1024 [04:57<05:00,  1.71it/s][A
 50%|████▉     | 511/1024 [04:58<05:00,  1.71it/s][A
 50%|█████     | 512/1024 [04:58<04:59,  1.71it/s][A
 50%|█████     | 513/1024 [04:59<04:58,  1.71it/s][A
 50%|█████     | 514/1024 [04:59<04:57,  1.72it/s][A
 50%|█████     | 515/1024 [05:00<04:56,  1.72it/s][A
 50%|█████     | 516/1024 [05:01<04:54,  1.72it/s][A
 50%|█████     | 517/1024 [05:01<04:55,  1.72it/s][A
 51%|█████     | 518/1024 [05:02<04:55,  1.71it/s][A
 51%|█████     | 519/1024 [

600/1024 iterations, loss:0.029980888590216637



 59%|█████▊    | 601/1024 [05:50<04:06,  1.72it/s][A
 59%|█████▉    | 602/1024 [05:51<04:05,  1.72it/s][A
 59%|█████▉    | 603/1024 [05:51<04:04,  1.72it/s][A
 59%|█████▉    | 604/1024 [05:52<04:03,  1.73it/s][A
 59%|█████▉    | 605/1024 [05:53<04:02,  1.73it/s][A
 59%|█████▉    | 606/1024 [05:53<04:01,  1.73it/s][A
 59%|█████▉    | 607/1024 [05:54<04:00,  1.73it/s][A
 59%|█████▉    | 608/1024 [05:54<04:00,  1.73it/s][A
 59%|█████▉    | 609/1024 [05:55<04:00,  1.72it/s][A
 60%|█████▉    | 610/1024 [05:56<04:00,  1.72it/s][A
 60%|█████▉    | 611/1024 [05:56<03:59,  1.72it/s][A
 60%|█████▉    | 612/1024 [05:57<03:59,  1.72it/s][A
 60%|█████▉    | 613/1024 [05:57<03:58,  1.72it/s][A
 60%|█████▉    | 614/1024 [05:58<03:57,  1.73it/s][A
 60%|██████    | 615/1024 [05:58<03:57,  1.72it/s][A
 60%|██████    | 616/1024 [05:59<03:56,  1.72it/s][A
 60%|██████    | 617/1024 [06:00<03:57,  1.72it/s][A
 60%|██████    | 618/1024 [06:00<03:56,  1.72it/s][A
 60%|██████    | 619/1024 [

700/1024 iterations, loss:0.02934993803501129



 68%|██████▊   | 701/1024 [06:49<03:09,  1.71it/s][A
 69%|██████▊   | 702/1024 [06:49<03:08,  1.70it/s][A
 69%|██████▊   | 703/1024 [06:50<03:07,  1.71it/s][A
 69%|██████▉   | 704/1024 [06:50<03:06,  1.71it/s][A
 69%|██████▉   | 705/1024 [06:51<03:05,  1.72it/s][A
 69%|██████▉   | 706/1024 [06:52<03:04,  1.72it/s][A
 69%|██████▉   | 707/1024 [06:52<03:04,  1.72it/s][A
 69%|██████▉   | 708/1024 [06:53<03:03,  1.72it/s][A
 69%|██████▉   | 709/1024 [06:53<03:02,  1.72it/s][A
 69%|██████▉   | 710/1024 [06:54<03:02,  1.72it/s][A
 69%|██████▉   | 711/1024 [06:55<03:01,  1.72it/s][A
 70%|██████▉   | 712/1024 [06:55<03:02,  1.71it/s][A
 70%|██████▉   | 713/1024 [06:56<03:01,  1.71it/s][A
 70%|██████▉   | 714/1024 [06:56<03:00,  1.72it/s][A
 70%|██████▉   | 715/1024 [06:57<03:00,  1.72it/s][A
 70%|██████▉   | 716/1024 [06:57<03:00,  1.71it/s][A
 70%|███████   | 717/1024 [06:58<02:58,  1.72it/s][A
 70%|███████   | 718/1024 [06:59<02:58,  1.72it/s][A
 70%|███████   | 719/1024 [

800/1024 iterations, loss:0.02954624593257904



 78%|███████▊  | 801/1024 [07:47<02:11,  1.70it/s][A
 78%|███████▊  | 802/1024 [07:48<02:09,  1.71it/s][A
 78%|███████▊  | 803/1024 [07:48<02:08,  1.72it/s][A
 79%|███████▊  | 804/1024 [07:49<02:08,  1.72it/s][A
 79%|███████▊  | 805/1024 [07:49<02:07,  1.72it/s][A
 79%|███████▊  | 806/1024 [07:50<02:06,  1.72it/s][A
 79%|███████▉  | 807/1024 [07:50<02:06,  1.72it/s][A
 79%|███████▉  | 808/1024 [07:51<02:05,  1.73it/s][A
 79%|███████▉  | 809/1024 [07:52<02:04,  1.73it/s][A
 79%|███████▉  | 810/1024 [07:52<02:03,  1.73it/s][A
 79%|███████▉  | 811/1024 [07:53<02:03,  1.73it/s][A
 79%|███████▉  | 812/1024 [07:53<02:02,  1.74it/s][A
 79%|███████▉  | 813/1024 [07:54<02:01,  1.73it/s][A
 79%|███████▉  | 814/1024 [07:55<02:01,  1.73it/s][A
 80%|███████▉  | 815/1024 [07:55<02:01,  1.72it/s][A
 80%|███████▉  | 816/1024 [07:56<02:00,  1.72it/s][A
 80%|███████▉  | 817/1024 [07:56<01:59,  1.73it/s][A
 80%|███████▉  | 818/1024 [07:57<01:59,  1.73it/s][A
 80%|███████▉  | 819/1024 [

900/1024 iterations, loss:0.03844504803419113



 88%|████████▊ | 901/1024 [08:45<01:12,  1.71it/s][A
 88%|████████▊ | 902/1024 [08:46<01:11,  1.71it/s][A
 88%|████████▊ | 903/1024 [08:46<01:10,  1.71it/s][A
 88%|████████▊ | 904/1024 [08:47<01:10,  1.71it/s][A
 88%|████████▊ | 905/1024 [08:48<01:09,  1.72it/s][A
 88%|████████▊ | 906/1024 [08:48<01:08,  1.72it/s][A
 89%|████████▊ | 907/1024 [08:49<01:08,  1.71it/s][A
 89%|████████▊ | 908/1024 [08:49<01:08,  1.70it/s][A
 89%|████████▉ | 909/1024 [08:50<01:07,  1.71it/s][A
 89%|████████▉ | 910/1024 [08:51<01:06,  1.72it/s][A
 89%|████████▉ | 911/1024 [08:51<01:05,  1.72it/s][A
 89%|████████▉ | 912/1024 [08:52<01:04,  1.72it/s][A
 89%|████████▉ | 913/1024 [08:52<01:04,  1.73it/s][A
 89%|████████▉ | 914/1024 [08:53<01:03,  1.72it/s][A
 89%|████████▉ | 915/1024 [08:53<01:03,  1.73it/s][A
 89%|████████▉ | 916/1024 [08:54<01:02,  1.72it/s][A
 90%|████████▉ | 917/1024 [08:55<01:02,  1.72it/s][A
 90%|████████▉ | 918/1024 [08:55<01:01,  1.72it/s][A
 90%|████████▉ | 919/1024 [

1000/1024 iterations, loss:0.06773126870393753



 98%|█████████▊| 1001/1024 [09:44<00:13,  1.72it/s][A
 98%|█████████▊| 1002/1024 [09:44<00:12,  1.71it/s][A
 98%|█████████▊| 1003/1024 [09:45<00:12,  1.70it/s][A
 98%|█████████▊| 1004/1024 [09:45<00:11,  1.69it/s][A
 98%|█████████▊| 1005/1024 [09:46<00:11,  1.67it/s][A
 98%|█████████▊| 1006/1024 [09:47<00:10,  1.65it/s][A
 98%|█████████▊| 1007/1024 [09:47<00:10,  1.67it/s][A
 98%|█████████▊| 1008/1024 [09:48<00:09,  1.69it/s][A
 99%|█████████▊| 1009/1024 [09:48<00:08,  1.70it/s][A
 99%|█████████▊| 1010/1024 [09:49<00:08,  1.69it/s][A
 99%|█████████▊| 1011/1024 [09:50<00:07,  1.70it/s][A
 99%|█████████▉| 1012/1024 [09:50<00:07,  1.70it/s][A
 99%|█████████▉| 1013/1024 [09:51<00:06,  1.71it/s][A
 99%|█████████▉| 1014/1024 [09:51<00:05,  1.71it/s][A
 99%|█████████▉| 1015/1024 [09:52<00:05,  1.72it/s][A
 99%|█████████▉| 1016/1024 [09:52<00:04,  1.72it/s][A
 99%|█████████▉| 1017/1024 [09:53<00:04,  1.72it/s][A
 99%|█████████▉| 1018/1024 [09:54<00:03,  1.72it/s][A
100%|████

epoch [5/5], loss:0.0286


100%|██████████| 5/5 [1:26:32<00:00, 1038.48s/it]
