import necessary libraries

In [1]:
import numpy as np
import pickle


data_path = '../Data/training_data/period0/'

### The model we'll be using below

In [2]:
import numpy as np
import torch as t
import torch.nn as nn

from torch import LongTensor as LT
from torch import FloatTensor as FT

 
class Bundler(nn.Module):

    def forward(self, data):
        raise NotImplementedError

    def forward_i(self, data):
        raise NotImplementedError

    def forward_o(self, data):
        raise NotImplementedError


class Word2Vec(Bundler):

    def __init__(self, vocab_size=20000, embedding_size=300, padding_idx=0):
        # this instantiate the parent class
        super(Word2Vec, self).__init__()
        self.vocab_size = vocab_size
        self.embedding_size = embedding_size
        # define embeddings for the target word matrix and the context word matrix
        self.ivectors = nn.Embedding(self.vocab_size, self.embedding_size, padding_idx=padding_idx)
        self.ovectors = nn.Embedding(self.vocab_size, self.embedding_size, padding_idx=padding_idx)
        # define parameters with initial weights: 0 for the padding and uniformly sampled weights for the vocab
        self.ivectors.weight = nn.Parameter(t.cat([t.zeros(1, self.embedding_size), FT(self.vocab_size - 1, self.embedding_size).uniform_(-0.5 / self.embedding_size, 0.5 / self.embedding_size)]))
        self.ovectors.weight = nn.Parameter(t.cat([t.zeros(1, self.embedding_size), FT(self.vocab_size - 1, self.embedding_size).uniform_(-0.5 / self.embedding_size, 0.5 / self.embedding_size)]))
        # indicates that we do not exclude this as it is the main part of the graph - this should be treated as parameters
        self.ivectors.weight.requires_grad = True
        self.ovectors.weight.requires_grad = True

    def forward(self, data):
        return self.forward_i(data)

    def forward_i(self, data):
        v = LT(data)
        v = v.cuda() if self.ivectors.weight.is_cuda else v
        return self.ivectors(v)

    def forward_o(self, data):
        v = LT(data)
        v = v.cuda() if self.ovectors.weight.is_cuda else v
        return self.ovectors(v)


class SGNS(nn.Module):

    def __init__(self, embedding, vocab_size=20000, n_negs=20, weights=None):
        super(SGNS, self).__init__()
        self.embedding = embedding
        self.vocab_size = vocab_size
        self.n_negs = n_negs
        self.weights = None
        if weights is not None:
            wf = np.power(weights, 0.75)
            wf = wf / wf.sum()
            self.weights = FT(wf)

    def forward(self, iword, owords):
        batch_size = iword.size()[0]
        context_size = owords.size()[1]
        if self.weights is not None:
            nwords = t.multinomial(self.weights, batch_size * context_size * self.n_negs, replacement=True).view(batch_size, -1)
        else:
            nwords = FT(batch_size, context_size * self.n_negs).uniform_(0, self.vocab_size - 1).long()
        ivectors = self.embedding.forward_i(iword).unsqueeze(2)
        ovectors = self.embedding.forward_o(owords)
        nvectors = self.embedding.forward_o(nwords).neg()
##-------------- this is the line we need to modify: add the euclidean distance as a regularisation term
##-------------- we will also consider the consine similarity
        oloss = t.bmm(ovectors, ivectors).squeeze().sigmoid().log().mean(1)
        nloss = t.bmm(nvectors, ivectors).squeeze().sigmoid().log().view(-1, context_size, self.n_negs).sum(2).mean(1)
        return(-(oloss + nloss).mean())

### code for training

In [3]:
import os
import pickle
import random
import argparse
import torch as t
import numpy as np

from tqdm import tqdm
from torch.optim import Adam
from torch.optim import SGD
from torch.utils.data import Dataset, DataLoader
#from model import Word2Vec, SGNS


def parse_args():
    parser = argparse.ArgumentParser()
    parser.add_argument('--name', type=str, default='sgns', help="model name")
    parser.add_argument('--data_dir', type=str, default='./data/', help="data directory path")
    parser.add_argument('--save_dir', type=str, default='./pts/', help="model directory path")
    parser.add_argument('--e_dim', type=int, default=300, help="embedding dimension")
    parser.add_argument('--n_negs', type=int, default=20, help="number of negative samples")
    parser.add_argument('--epoch', type=int, default=100, help="number of epochs")
    parser.add_argument('--mb', type=int, default=4096, help="mini-batch size")
    parser.add_argument('--ss_t', type=float, default=1e-5, help="subsample threshold")
    parser.add_argument('--conti', action='store_true', help="continue learning")
    parser.add_argument('--weights', action='store_true', help="use weights for negative sampling")
    parser.add_argument('--cuda', action='store_true', help="use CUDA")
    return parser.parse_args()


class PermutedSubsampledCorpus(Dataset):

    def __init__(self, datapath, ws=None):
        data = pickle.load(open(datapath, 'rb'))
        if ws is not None:
            self.data = []
            for iword, owords in data:
                if random.random() > ws[iword]:
                    self.data.append((iword, owords))
        else:
            self.data = data

    def __len__(self):
        return len(self.data)

    def __getitem__(self, idx):
        iword, owords = self.data[idx]
        return iword, np.array(owords)


def train(args):
    idx2word = pickle.load(open(os.path.join(args.data_dir, 'idx2word.dat'), 'rb'))
    wc = pickle.load(open(os.path.join(args.data_dir, 'wc.dat'), 'rb'))
    wf = np.array([wc[word] for word in idx2word])
    wf = wf / wf.sum()
    ws = 1 - np.sqrt(args.ss_t / wf)
    ws = np.clip(ws, 0, 1)
    vocab_size = len(idx2word)
    weights = wf if args.weights else None
    if not os.path.isdir(args.save_dir):
        os.mkdir(args.save_dir)
    model = Word2Vec(vocab_size=vocab_size, embedding_size=args.e_dim)
    modelpath = os.path.join(args.save_dir, '{}.pt'.format(args.name))
    sgns = SGNS(embedding=model, vocab_size=vocab_size, n_negs=args.n_negs, weights=weights)
    if os.path.isfile(modelpath) and args.conti:
        sgns.load_state_dict(t.load(modelpath))
    if args.cuda:
        sgns = sgns.cuda()
    optim = Adam(sgns.parameters())
    optimpath = os.path.join(args.save_dir, '{}.optim.pt'.format(args.name))
    if os.path.isfile(optimpath) and args.conti:
        optim.load_state_dict(t.load(optimpath))
    for epoch in range(1, args.epoch + 1):
        dataset = PermutedSubsampledCorpus(os.path.join(args.data_dir, 'train.dat'))
        dataloader = DataLoader(dataset, batch_size=args.mb, shuffle=True)
        total_batches = int(np.ceil(len(dataset) / args.mb))
        pbar = tqdm(dataloader)
        pbar.set_description("[Epoch {}]".format(epoch))
        for iword, owords in pbar:
            loss = sgns(iword, owords)
            optim.zero_grad()
            loss.backward()
            optim.step()
            pbar.set_postfix(loss=loss.item())
    idx2vec = model.ivectors.weight.data.cpu().numpy()
    pickle.dump(idx2vec, open(os.path.join(args.data_dir, 'idx2vec.dat'), 'wb'))
    t.save(sgns.state_dict(), os.path.join(args.save_dir, '{}.pt'.format(args.name)))
    t.save(optim.state_dict(), os.path.join(args.save_dir, '{}.optim.pt'.format(args.name)))


#if __name__ == '__main__':
 #   train(parse_args())

### We'll go through this line by line

In [4]:
import os
import pickle
import random

import argparse
import torch as t
import numpy as np

from tqdm import tqdm
from torch.optim import Adam
from torch.utils.data import Dataset, DataLoader
#from model import Word2Vec, SGNS

In [5]:
# loading in idx2word and word counts and calculating the normalised frequency for words in the idx

with(open(os.path.join(data_path, 'idx2word.dat'), 'rb')) as handle:
    idx2word = pickle.load(handle)
with(open(os.path.join(data_path, 'wc.dat'), 'rb')) as handle:
    wc = pickle.load(handle)
wf = np.array([wc[word] for word in idx2word])
wf = wf / wf.sum()

In [6]:
# calculating the subsampling proba and obtaining vocab size

ss_t = 0.00001

ws = 1 - np.sqrt(ss_t / wf)
ws = np.clip(ws, 0, 1)
vocab_size = len(idx2word)

In [14]:
# do we wanna use weights for negsampling?
use_weights = True
weights = wf if use_weights else None

In [15]:
save_dir = data_path+'res/'
if not os.path.isdir(save_dir):
    os.mkdir(save_dir)

In [16]:
# call and instantiate the model class
emb_dim = 300
model_name = 'period0'

model = Word2Vec(vocab_size=vocab_size, embedding_size=emb_dim)
modelpath = os.path.join(save_dir, '{}.pt'.format(model_name))

In [17]:
# call the SGNS model and instantiate
n_negs = 100

sgns = SGNS(embedding=model, vocab_size=vocab_size, n_negs=n_negs, weights=weights)

In [18]:
# do we wanna pick up from a previous learning?
# do we wanna use CUDA

conti = False
cuda = True

if os.path.isfile(modelpath) and conti:
    sgns.load_state_dict(t.load(modelpath))
if cuda:
    sgns = sgns.cuda()

In [19]:
# call the optimiser, we use Adam, can also use SGD
optim = Adam(sgns.parameters(), lr=2e-3)
optimpath = os.path.join(save_dir, '{}.optim.pt'.format(model_name))
if os.path.isfile(optimpath) and conti:
    optim.load_state_dict(t.load(optimpath))

In [20]:
# train!
n_epoch = 8
mb = 1000

for epoch in range(1, n_epoch + 1):
    dataset = PermutedSubsampledCorpus(os.path.join(data_path, 'train.dat'), ws)
    dataloader = DataLoader(dataset, batch_size=mb, shuffle=True)
    total_batches = int(np.ceil(len(dataset) / mb))
    pbar = tqdm(dataloader)
    pbar.set_description("[Epoch {}]".format(epoch))
    for iword, owords in pbar:
        loss = sgns(iword, owords)
        #grad = sgns(iword, owords)[1]
        #print(grad)
        optim.zero_grad()
        loss.backward()
        optim.step()
        pbar.set_postfix(loss=loss.item())

[Epoch 1]: 100%|██████████| 717/717 [04:32<00:00,  2.64it/s, loss=15.9]
[Epoch 2]: 100%|██████████| 717/717 [04:32<00:00,  2.64it/s, loss=14.2]
[Epoch 3]: 100%|██████████| 716/716 [04:30<00:00,  2.65it/s, loss=26.8]
[Epoch 4]: 100%|██████████| 716/716 [04:31<00:00,  2.64it/s, loss=15.2]
[Epoch 5]: 100%|██████████| 716/716 [04:31<00:00,  2.63it/s, loss=37.8]
[Epoch 6]: 100%|██████████| 716/716 [04:31<00:00,  2.63it/s, loss=13.9]
[Epoch 7]: 100%|██████████| 716/716 [04:29<00:00,  2.65it/s, loss=13.6]
[Epoch 8]: 100%|██████████| 717/717 [04:31<00:00,  2.64it/s, loss=17.2]


In [21]:
idx2vec = model.ivectors.weight.data.cpu().numpy()
#pickle.dump(idx2vec, open(data_path+'idx2vec.dat'), 'wb')
t.save(sgns.state_dict(), os.path.join(save_dir, '{}.pt'.format(model_name)))
t.save(optim.state_dict(), os.path.join(save_dir, '{}.optim.pt'.format(model_name)))

In [22]:
model.ivectors.weight.data.cpu().numpy()

array([[ 0.        ,  0.        ,  0.        , ...,  0.        ,
         0.        ,  0.        ],
       [ 0.05689228,  0.15685235,  0.07270526, ...,  0.15389794,
         0.09007584,  0.0774914 ],
       [ 0.00632227,  0.01002212,  0.09341568, ...,  0.10295281,
         0.15408444,  0.09707116],
       ..., 
       [ 0.03852747,  0.06537829,  0.04834054, ...,  0.07518096,
         0.08379278,  0.0544805 ],
       [ 0.03027225,  0.02561502, -0.0026253 , ...,  0.0233258 ,
         0.02598815,  0.05608466],
       [ 0.0625817 ,  0.057478  ,  0.05790081, ...,  0.00474848,
        -0.03421123,  0.05335202]], dtype=float32)

In [23]:
vector3 = model.ivectors.weight.data.cpu().numpy()[3]
vector3

array([ 0.05789586,  0.04476868,  0.09167903, -0.17152733,  0.10329971,
        0.03014417,  0.01219846, -0.13819744, -0.00565925,  0.03899888,
        0.03732952, -0.0898168 , -0.07575436,  0.02051679, -0.02981773,
       -0.07936405,  0.00382746, -0.01618091, -0.08324953, -0.1328506 ,
        0.10098054, -0.08548413,  0.07240234,  0.02332029,  0.05415119,
       -0.06823785, -0.05450507,  0.09783662, -0.01419741,  0.00150108,
       -0.00262661, -0.04425149, -0.13105522, -0.00611185, -0.02356478,
        0.02706797, -0.09736105,  0.04132115, -0.03511995,  0.00675131,
        0.02178738,  0.01402447, -0.11562996, -0.01941235, -0.0577183 ,
       -0.03773048, -0.00415369,  0.01645307,  0.05912367,  0.03455342,
        0.0583756 , -0.0349873 , -0.00496768, -0.09155397,  0.06138192,
        0.03567986, -0.13077518,  0.01166302,  0.13653545, -0.11633229,
        0.05879457,  0.02754627,  0.03053075, -0.00725776,  0.19709015,
        0.04714454, -0.09065689,  0.02722152,  0.0851267 , -0.04

In [24]:
with open(data_path + 'word2idx.dat', 'rb') as handle:
    word2idx = pickle.load(handle)

In [25]:
word0, word1 = 'shoe','great'
if word0 in idx2word and word1 in idx2word:
    comp_idx = word2idx[word0], word2idx[word1]
    print(comp_idx)
else:
    print('not found')

(11820, 337)


In [26]:
array0, array1 = model.ivectors.weight.data.cpu().numpy()[comp_idx[0]],model.ivectors.weight.data.cpu().numpy()[comp_idx[1]]

In [27]:
from scipy import spatial

result = 1 - spatial.distance.cosine(array0, array1)
print(result)

0.501607239246


In [36]:
res = [1 - spatial.distance.cosine(model.ivectors.weight.data.cpu().numpy()[3], model.ivectors.weight.data.cpu().numpy()[i]) for i in tqdm(range(1, vocab_size))]


  0%|          | 0/19999 [00:00<?, ?it/s][A
  0%|          | 4/19999 [00:00<08:28, 39.33it/s][A
  0%|          | 9/19999 [00:00<08:09, 40.80it/s][A
  0%|          | 14/19999 [00:00<07:37, 43.66it/s][A
  0%|          | 20/19999 [00:00<07:17, 45.66it/s][A
  0%|          | 26/19999 [00:00<07:07, 46.77it/s][A
  0%|          | 32/19999 [00:00<07:00, 47.48it/s][A
  0%|          | 38/19999 [00:00<06:55, 48.01it/s][A
  0%|          | 44/19999 [00:00<06:51, 48.47it/s][A
  0%|          | 50/19999 [00:01<06:48, 48.78it/s][A
  0%|          | 56/19999 [00:01<06:46, 49.03it/s][A
  0%|          | 61/19999 [00:01<06:45, 49.12it/s][A
  0%|          | 67/19999 [00:01<06:44, 49.29it/s][A
  0%|          | 73/19999 [00:01<06:50, 48.49it/s][A
  0%|          | 78/19999 [00:01<06:55, 47.97it/s][A
  0%|          | 83/19999 [00:01<06:58, 47.55it/s][A
  0%|          | 88/19999 [00:01<06:59, 47.48it/s][A
  0%|          | 94/19999 [00:01<06:57, 47.71it/s][A
  1%|          | 100/19999 [00:02<06:5

  4%|▍         | 832/19999 [00:17<06:46, 47.17it/s][A
  4%|▍         | 837/19999 [00:17<06:46, 47.13it/s][A
  4%|▍         | 842/19999 [00:17<06:46, 47.09it/s][A
  4%|▍         | 847/19999 [00:18<06:47, 47.05it/s][A
  4%|▍         | 852/19999 [00:18<06:47, 47.01it/s][A
  4%|▍         | 857/19999 [00:18<06:47, 46.98it/s][A
  4%|▍         | 862/19999 [00:18<06:47, 46.94it/s][A
  4%|▍         | 867/19999 [00:18<06:47, 46.90it/s][A
  4%|▍         | 872/19999 [00:18<06:48, 46.86it/s][A
  4%|▍         | 877/19999 [00:18<06:48, 46.86it/s][A
  4%|▍         | 882/19999 [00:18<06:48, 46.83it/s][A
  4%|▍         | 887/19999 [00:18<06:48, 46.79it/s][A
  4%|▍         | 892/19999 [00:19<06:48, 46.81it/s][A
  4%|▍         | 898/19999 [00:19<06:47, 46.84it/s][A
  5%|▍         | 904/19999 [00:19<06:47, 46.86it/s][A
  5%|▍         | 909/19999 [00:19<06:47, 46.88it/s][A
  5%|▍         | 915/19999 [00:19<06:46, 46.90it/s][A
  5%|▍         | 921/19999 [00:19<06:46, 46.92it/s][A
  5%|▍    

  8%|▊         | 1655/19999 [00:35<06:28, 47.21it/s][A
  8%|▊         | 1660/19999 [00:35<06:28, 47.19it/s][A
  8%|▊         | 1665/19999 [00:35<06:28, 47.17it/s][A
  8%|▊         | 1670/19999 [00:35<06:28, 47.15it/s][A
  8%|▊         | 1675/19999 [00:35<06:28, 47.13it/s][A
  8%|▊         | 1680/19999 [00:35<06:28, 47.11it/s][A
  8%|▊         | 1685/19999 [00:35<06:28, 47.09it/s][A
  8%|▊         | 1690/19999 [00:35<06:28, 47.08it/s][A
  8%|▊         | 1695/19999 [00:36<06:28, 47.06it/s][A
  9%|▊         | 1701/19999 [00:36<06:28, 47.07it/s][A
  9%|▊         | 1707/19999 [00:36<06:28, 47.09it/s][A
  9%|▊         | 1713/19999 [00:36<06:28, 47.10it/s][A
  9%|▊         | 1719/19999 [00:36<06:27, 47.11it/s][A
  9%|▊         | 1725/19999 [00:36<06:27, 47.12it/s][A
  9%|▊         | 1731/19999 [00:36<06:27, 47.14it/s][A
  9%|▊         | 1736/19999 [00:36<06:27, 47.12it/s][A
  9%|▊         | 1741/19999 [00:36<06:27, 47.10it/s][A
  9%|▊         | 1746/19999 [00:37<06:27, 47.09i

 12%|█▏        | 2469/19999 [00:52<06:12, 47.11it/s][A
 12%|█▏        | 2474/19999 [00:52<06:12, 47.09it/s][A
 12%|█▏        | 2479/19999 [00:52<06:12, 47.08it/s][A
 12%|█▏        | 2484/19999 [00:52<06:12, 47.07it/s][A
 12%|█▏        | 2489/19999 [00:52<06:12, 47.06it/s][A
 12%|█▏        | 2494/19999 [00:53<06:12, 47.04it/s][A
 12%|█▏        | 2499/19999 [00:53<06:12, 47.03it/s][A
 13%|█▎        | 2504/19999 [00:53<06:12, 47.02it/s][A
 13%|█▎        | 2509/19999 [00:53<06:12, 47.01it/s][A
 13%|█▎        | 2514/19999 [00:53<06:12, 46.99it/s][A
 13%|█▎        | 2519/19999 [00:53<06:12, 46.98it/s][A
 13%|█▎        | 2524/19999 [00:53<06:12, 46.97it/s][A
 13%|█▎        | 2529/19999 [00:53<06:12, 46.95it/s][A
 13%|█▎        | 2534/19999 [00:53<06:12, 46.94it/s][A
 13%|█▎        | 2539/19999 [00:54<06:12, 46.93it/s][A
 13%|█▎        | 2544/19999 [00:54<06:12, 46.91it/s][A
 13%|█▎        | 2549/19999 [00:54<06:11, 46.92it/s][A
 13%|█▎        | 2554/19999 [00:54<06:11, 46.90i

 16%|█▌        | 3243/19999 [01:09<06:01, 46.39it/s][A
 16%|█▌        | 3249/19999 [01:10<06:00, 46.40it/s][A
 16%|█▋        | 3255/19999 [01:10<06:00, 46.41it/s][A
 16%|█▋        | 3261/19999 [01:10<06:00, 46.40it/s][A
 16%|█▋        | 3266/19999 [01:10<06:00, 46.39it/s][A
 16%|█▋        | 3272/19999 [01:10<06:00, 46.40it/s][A
 16%|█▋        | 3278/19999 [01:10<06:00, 46.41it/s][A
 16%|█▋        | 3284/19999 [01:10<06:00, 46.42it/s][A
 16%|█▋        | 3290/19999 [01:10<05:59, 46.42it/s][A
 16%|█▋        | 3296/19999 [01:10<05:59, 46.43it/s][A
 17%|█▋        | 3302/19999 [01:11<05:59, 46.44it/s][A
 17%|█▋        | 3308/19999 [01:11<05:59, 46.44it/s][A
 17%|█▋        | 3314/19999 [01:11<05:59, 46.45it/s][A
 17%|█▋        | 3320/19999 [01:11<05:59, 46.46it/s][A
 17%|█▋        | 3326/19999 [01:11<05:58, 46.46it/s][A
 17%|█▋        | 3332/19999 [01:11<05:58, 46.47it/s][A
 17%|█▋        | 3338/19999 [01:11<05:58, 46.48it/s][A
 17%|█▋        | 3344/19999 [01:11<05:58, 46.49i

 20%|██        | 4033/19999 [01:27<05:45, 46.15it/s][A
 20%|██        | 4038/19999 [01:27<05:45, 46.14it/s][A
 20%|██        | 4043/19999 [01:27<05:45, 46.13it/s][A
 20%|██        | 4048/19999 [01:27<05:45, 46.12it/s][A
 20%|██        | 4053/19999 [01:27<05:45, 46.11it/s][A
 20%|██        | 4058/19999 [01:28<05:45, 46.11it/s][A
 20%|██        | 4063/19999 [01:28<05:45, 46.10it/s][A
 20%|██        | 4068/19999 [01:28<05:45, 46.09it/s][A
 20%|██        | 4073/19999 [01:28<05:45, 46.08it/s][A
 20%|██        | 4078/19999 [01:28<05:45, 46.08it/s][A
 20%|██        | 4083/19999 [01:28<05:45, 46.07it/s][A
 20%|██        | 4088/19999 [01:28<05:45, 46.06it/s][A
 20%|██        | 4093/19999 [01:28<05:45, 46.05it/s][A
 20%|██        | 4098/19999 [01:29<05:45, 46.04it/s][A
 21%|██        | 4103/19999 [01:29<05:45, 46.04it/s][A
 21%|██        | 4108/19999 [01:29<05:45, 46.03it/s][A
 21%|██        | 4113/19999 [01:29<05:45, 46.02it/s][A
 21%|██        | 4118/19999 [01:29<05:45, 46.02i

 24%|██▍       | 4844/19999 [01:44<05:27, 46.24it/s][A
 24%|██▍       | 4849/19999 [01:44<05:27, 46.24it/s][A
 24%|██▍       | 4854/19999 [01:44<05:27, 46.23it/s][A
 24%|██▍       | 4859/19999 [01:45<05:27, 46.23it/s][A
 24%|██▍       | 4864/19999 [01:45<05:27, 46.22it/s][A
 24%|██▍       | 4869/19999 [01:45<05:27, 46.22it/s][A
 24%|██▍       | 4874/19999 [01:45<05:27, 46.21it/s][A
 24%|██▍       | 4879/19999 [01:45<05:27, 46.20it/s][A
 24%|██▍       | 4884/19999 [01:45<05:27, 46.20it/s][A
 24%|██▍       | 4889/19999 [01:45<05:27, 46.19it/s][A
 24%|██▍       | 4894/19999 [01:45<05:27, 46.19it/s][A
 25%|██▍       | 4900/19999 [01:46<05:26, 46.19it/s][A
 25%|██▍       | 4906/19999 [01:46<05:26, 46.20it/s][A
 25%|██▍       | 4912/19999 [01:46<05:26, 46.20it/s][A
 25%|██▍       | 4918/19999 [01:46<05:26, 46.21it/s][A
 25%|██▍       | 4924/19999 [01:46<05:26, 46.21it/s][A
 25%|██▍       | 4930/19999 [01:46<05:26, 46.22it/s][A
 25%|██▍       | 4936/19999 [01:46<05:25, 46.23i

 28%|██▊       | 5665/19999 [02:02<05:09, 46.34it/s][A
 28%|██▊       | 5670/19999 [02:02<05:09, 46.34it/s][A
 28%|██▊       | 5675/19999 [02:02<05:09, 46.33it/s][A
 28%|██▊       | 5680/19999 [02:02<05:09, 46.32it/s][A
 28%|██▊       | 5685/19999 [02:02<05:09, 46.32it/s][A
 28%|██▊       | 5690/19999 [02:02<05:08, 46.31it/s][A
 28%|██▊       | 5695/19999 [02:02<05:08, 46.31it/s][A
 29%|██▊       | 5700/19999 [02:03<05:08, 46.30it/s][A
 29%|██▊       | 5705/19999 [02:03<05:08, 46.30it/s][A
 29%|██▊       | 5710/19999 [02:03<05:08, 46.29it/s][A
 29%|██▊       | 5715/19999 [02:03<05:08, 46.29it/s][A
 29%|██▊       | 5720/19999 [02:03<05:08, 46.28it/s][A
 29%|██▊       | 5725/19999 [02:03<05:08, 46.28it/s][A
 29%|██▊       | 5731/19999 [02:03<05:08, 46.29it/s][A
 29%|██▊       | 5737/19999 [02:03<05:08, 46.29it/s][A
 29%|██▊       | 5743/19999 [02:04<05:07, 46.30it/s][A
 29%|██▊       | 5748/19999 [02:04<05:07, 46.29it/s][A
 29%|██▉       | 5753/19999 [02:04<05:07, 46.29i

 32%|███▏      | 6454/19999 [02:19<04:52, 46.24it/s][A
 32%|███▏      | 6460/19999 [02:19<04:52, 46.24it/s][A
 32%|███▏      | 6466/19999 [02:19<04:52, 46.25it/s][A
 32%|███▏      | 6472/19999 [02:19<04:52, 46.25it/s][A
 32%|███▏      | 6478/19999 [02:20<04:52, 46.25it/s][A
 32%|███▏      | 6483/19999 [02:20<04:52, 46.24it/s][A
 32%|███▏      | 6488/19999 [02:20<04:52, 46.24it/s][A
 32%|███▏      | 6493/19999 [02:20<04:52, 46.24it/s][A
 32%|███▏      | 6498/19999 [02:20<04:52, 46.23it/s][A
 33%|███▎      | 6503/19999 [02:20<04:51, 46.23it/s][A
 33%|███▎      | 6509/19999 [02:20<04:51, 46.23it/s][A
 33%|███▎      | 6515/19999 [02:20<04:51, 46.24it/s][A
 33%|███▎      | 6521/19999 [02:21<04:51, 46.24it/s][A
 33%|███▎      | 6527/19999 [02:21<04:51, 46.24it/s][A
 33%|███▎      | 6533/19999 [02:21<04:51, 46.25it/s][A
 33%|███▎      | 6538/19999 [02:21<04:51, 46.24it/s][A
 33%|███▎      | 6543/19999 [02:21<04:51, 46.24it/s][A
 33%|███▎      | 6548/19999 [02:21<04:50, 46.23i

 36%|███▌      | 7236/19999 [02:37<04:37, 46.04it/s][A
 36%|███▌      | 7241/19999 [02:37<04:37, 46.03it/s][A
 36%|███▌      | 7246/19999 [02:37<04:37, 46.03it/s][A
 36%|███▋      | 7251/19999 [02:37<04:36, 46.03it/s][A
 36%|███▋      | 7256/19999 [02:37<04:36, 46.02it/s][A
 36%|███▋      | 7261/19999 [02:37<04:36, 46.02it/s][A
 36%|███▋      | 7266/19999 [02:37<04:36, 46.02it/s][A
 36%|███▋      | 7271/19999 [02:38<04:36, 46.01it/s][A
 36%|███▋      | 7276/19999 [02:38<04:36, 46.01it/s][A
 36%|███▋      | 7282/19999 [02:38<04:36, 46.01it/s][A
 36%|███▋      | 7288/19999 [02:38<04:36, 46.02it/s][A
 36%|███▋      | 7293/19999 [02:38<04:36, 46.02it/s][A
 36%|███▋      | 7299/19999 [02:38<04:35, 46.02it/s][A
 37%|███▋      | 7305/19999 [02:38<04:35, 46.02it/s][A
 37%|███▋      | 7311/19999 [02:38<04:35, 46.03it/s][A
 37%|███▋      | 7317/19999 [02:38<04:35, 46.03it/s][A
 37%|███▋      | 7323/19999 [02:39<04:35, 46.04it/s][A
 37%|███▋      | 7329/19999 [02:39<04:35, 46.04i

 40%|████      | 8047/19999 [02:54<04:19, 46.11it/s][A
 40%|████      | 8052/19999 [02:54<04:19, 46.11it/s][A
 40%|████      | 8057/19999 [02:54<04:19, 46.10it/s][A
 40%|████      | 8062/19999 [02:54<04:18, 46.10it/s][A
 40%|████      | 8067/19999 [02:55<04:18, 46.10it/s][A
 40%|████      | 8072/19999 [02:55<04:18, 46.09it/s][A
 40%|████      | 8077/19999 [02:55<04:18, 46.09it/s][A
 40%|████      | 8082/19999 [02:55<04:18, 46.09it/s][A
 40%|████      | 8088/19999 [02:55<04:18, 46.09it/s][A
 40%|████      | 8094/19999 [02:55<04:18, 46.09it/s][A
 41%|████      | 8100/19999 [02:55<04:18, 46.10it/s][A
 41%|████      | 8105/19999 [02:55<04:18, 46.10it/s][A
 41%|████      | 8111/19999 [02:55<04:17, 46.10it/s][A
 41%|████      | 8117/19999 [02:56<04:17, 46.11it/s][A
 41%|████      | 8122/19999 [02:56<04:17, 46.11it/s][A
 41%|████      | 8128/19999 [02:56<04:17, 46.11it/s][A
 41%|████      | 8133/19999 [02:56<04:17, 46.11it/s][A
 41%|████      | 8139/19999 [02:56<04:17, 46.12i

 44%|████▍     | 8860/19999 [03:11<04:01, 46.20it/s][A
 44%|████▍     | 8866/19999 [03:11<04:00, 46.20it/s][A
 44%|████▍     | 8871/19999 [03:12<04:00, 46.20it/s][A
 44%|████▍     | 8876/19999 [03:12<04:00, 46.19it/s][A
 44%|████▍     | 8881/19999 [03:12<04:00, 46.19it/s][A
 44%|████▍     | 8886/19999 [03:12<04:00, 46.19it/s][A
 44%|████▍     | 8891/19999 [03:12<04:00, 46.18it/s][A
 44%|████▍     | 8897/19999 [03:12<04:00, 46.19it/s][A
 45%|████▍     | 8902/19999 [03:12<04:00, 46.18it/s][A
 45%|████▍     | 8908/19999 [03:12<04:00, 46.19it/s][A
 45%|████▍     | 8914/19999 [03:12<03:59, 46.19it/s][A
 45%|████▍     | 8919/19999 [03:13<03:59, 46.19it/s][A
 45%|████▍     | 8925/19999 [03:13<03:59, 46.19it/s][A
 45%|████▍     | 8931/19999 [03:13<03:59, 46.20it/s][A
 45%|████▍     | 8937/19999 [03:13<03:59, 46.20it/s][A
 45%|████▍     | 8943/19999 [03:13<03:59, 46.20it/s][A
 45%|████▍     | 8949/19999 [03:13<03:59, 46.20it/s][A
 45%|████▍     | 8954/19999 [03:13<03:59, 46.20i

 48%|████▊     | 9661/19999 [03:29<03:43, 46.16it/s][A
 48%|████▊     | 9667/19999 [03:29<03:43, 46.16it/s][A
 48%|████▊     | 9673/19999 [03:29<03:43, 46.17it/s][A
 48%|████▊     | 9679/19999 [03:29<03:43, 46.17it/s][A
 48%|████▊     | 9685/19999 [03:29<03:43, 46.17it/s][A
 48%|████▊     | 9691/19999 [03:29<03:43, 46.17it/s][A
 48%|████▊     | 9697/19999 [03:29<03:43, 46.18it/s][A
 49%|████▊     | 9703/19999 [03:30<03:42, 46.18it/s][A
 49%|████▊     | 9709/19999 [03:30<03:42, 46.18it/s][A
 49%|████▊     | 9715/19999 [03:30<03:42, 46.18it/s][A
 49%|████▊     | 9721/19999 [03:30<03:42, 46.19it/s][A
 49%|████▊     | 9727/19999 [03:30<03:42, 46.19it/s][A
 49%|████▊     | 9733/19999 [03:30<03:42, 46.20it/s][A
 49%|████▊     | 9739/19999 [03:30<03:42, 46.20it/s][A
 49%|████▊     | 9745/19999 [03:30<03:41, 46.20it/s][A
 49%|████▉     | 9751/19999 [03:31<03:41, 46.20it/s][A
 49%|████▉     | 9757/19999 [03:31<03:41, 46.21it/s][A
 49%|████▉     | 9763/19999 [03:31<03:41, 46.21i

 52%|█████▏    | 10438/19999 [03:46<03:27, 46.09it/s][A
 52%|█████▏    | 10443/19999 [03:46<03:27, 46.10it/s][A
 52%|█████▏    | 10448/19999 [03:46<03:27, 46.09it/s][A
 52%|█████▏    | 10453/19999 [03:46<03:27, 46.09it/s][A
 52%|█████▏    | 10458/19999 [03:46<03:27, 46.09it/s][A
 52%|█████▏    | 10463/19999 [03:47<03:26, 46.08it/s][A
 52%|█████▏    | 10468/19999 [03:47<03:26, 46.08it/s][A
 52%|█████▏    | 10473/19999 [03:47<03:26, 46.08it/s][A
 52%|█████▏    | 10478/19999 [03:47<03:26, 46.08it/s][A
 52%|█████▏    | 10483/19999 [03:47<03:26, 46.07it/s][A
 52%|█████▏    | 10488/19999 [03:47<03:26, 46.07it/s][A
 52%|█████▏    | 10494/19999 [03:47<03:26, 46.08it/s][A
 53%|█████▎    | 10500/19999 [03:47<03:26, 46.08it/s][A
 53%|█████▎    | 10505/19999 [03:47<03:26, 46.08it/s][A
 53%|█████▎    | 10510/19999 [03:48<03:25, 46.07it/s][A
 53%|█████▎    | 10515/19999 [03:48<03:25, 46.07it/s][A
 53%|█████▎    | 10520/19999 [03:48<03:25, 46.07it/s][A
 53%|█████▎    | 10525/19999 [0

 56%|█████▌    | 11206/19999 [04:03<03:11, 46.01it/s][A
 56%|█████▌    | 11212/19999 [04:03<03:10, 46.01it/s][A
 56%|█████▌    | 11218/19999 [04:03<03:10, 46.01it/s][A
 56%|█████▌    | 11224/19999 [04:03<03:10, 46.01it/s][A
 56%|█████▌    | 11230/19999 [04:04<03:10, 46.02it/s][A
 56%|█████▌    | 11236/19999 [04:04<03:10, 46.02it/s][A
 56%|█████▌    | 11242/19999 [04:04<03:10, 46.02it/s][A
 56%|█████▌    | 11248/19999 [04:04<03:10, 46.02it/s][A
 56%|█████▋    | 11254/19999 [04:04<03:10, 46.03it/s][A
 56%|█████▋    | 11260/19999 [04:04<03:09, 46.03it/s][A
 56%|█████▋    | 11266/19999 [04:04<03:09, 46.03it/s][A
 56%|█████▋    | 11272/19999 [04:04<03:09, 46.03it/s][A
 56%|█████▋    | 11277/19999 [04:05<03:09, 46.03it/s][A
 56%|█████▋    | 11282/19999 [04:05<03:09, 46.03it/s][A
 56%|█████▋    | 11288/19999 [04:05<03:09, 46.03it/s][A
 56%|█████▋    | 11294/19999 [04:05<03:09, 46.03it/s][A
 57%|█████▋    | 11300/19999 [04:05<03:08, 46.03it/s][A
 57%|█████▋    | 11306/19999 [0

 60%|██████    | 12023/19999 [04:20<02:52, 46.13it/s][A
 60%|██████    | 12028/19999 [04:20<02:52, 46.13it/s][A
 60%|██████    | 12033/19999 [04:20<02:52, 46.13it/s][A
 60%|██████    | 12038/19999 [04:20<02:52, 46.13it/s][A
 60%|██████    | 12043/19999 [04:21<02:52, 46.12it/s][A
 60%|██████    | 12048/19999 [04:21<02:52, 46.12it/s][A
 60%|██████    | 12053/19999 [04:21<02:52, 46.12it/s][A
 60%|██████    | 12058/19999 [04:21<02:52, 46.12it/s][A
 60%|██████    | 12063/19999 [04:21<02:52, 46.11it/s][A
 60%|██████    | 12068/19999 [04:21<02:51, 46.11it/s][A
 60%|██████    | 12073/19999 [04:21<02:51, 46.11it/s][A
 60%|██████    | 12078/19999 [04:21<02:51, 46.11it/s][A
 60%|██████    | 12083/19999 [04:22<02:51, 46.10it/s][A
 60%|██████    | 12088/19999 [04:22<02:51, 46.10it/s][A
 60%|██████    | 12093/19999 [04:22<02:51, 46.10it/s][A
 60%|██████    | 12098/19999 [04:22<02:51, 46.10it/s][A
 61%|██████    | 12103/19999 [04:22<02:51, 46.09it/s][A
 61%|██████    | 12108/19999 [0

 64%|██████▍   | 12774/19999 [04:37<02:37, 45.98it/s][A
 64%|██████▍   | 12780/19999 [04:37<02:37, 45.98it/s][A
 64%|██████▍   | 12785/19999 [04:38<02:36, 45.98it/s][A
 64%|██████▍   | 12790/19999 [04:38<02:36, 45.98it/s][A
 64%|██████▍   | 12796/19999 [04:38<02:36, 45.98it/s][A
 64%|██████▍   | 12802/19999 [04:38<02:36, 45.99it/s][A
 64%|██████▍   | 12807/19999 [04:38<02:36, 45.99it/s][A
 64%|██████▍   | 12813/19999 [04:38<02:36, 45.99it/s][A
 64%|██████▍   | 12819/19999 [04:38<02:36, 45.99it/s][A
 64%|██████▍   | 12825/19999 [04:38<02:35, 45.99it/s][A
 64%|██████▍   | 12831/19999 [04:38<02:35, 45.99it/s][A
 64%|██████▍   | 12836/19999 [04:39<02:35, 45.99it/s][A
 64%|██████▍   | 12841/19999 [04:39<02:35, 45.99it/s][A
 64%|██████▍   | 12846/19999 [04:39<02:35, 45.99it/s][A
 64%|██████▍   | 12851/19999 [04:39<02:35, 45.99it/s][A
 64%|██████▍   | 12857/19999 [04:39<02:35, 45.99it/s][A
 64%|██████▍   | 12862/19999 [04:39<02:35, 45.99it/s][A
 64%|██████▍   | 12867/19999 [0

 68%|██████▊   | 13587/19999 [04:54<02:19, 46.08it/s][A
 68%|██████▊   | 13593/19999 [04:54<02:19, 46.08it/s][A
 68%|██████▊   | 13599/19999 [04:55<02:18, 46.08it/s][A
 68%|██████▊   | 13605/19999 [04:55<02:18, 46.09it/s][A
 68%|██████▊   | 13611/19999 [04:55<02:18, 46.09it/s][A
 68%|██████▊   | 13617/19999 [04:55<02:18, 46.09it/s][A
 68%|██████▊   | 13623/19999 [04:55<02:18, 46.09it/s][A
 68%|██████▊   | 13629/19999 [04:55<02:18, 46.09it/s][A
 68%|██████▊   | 13635/19999 [04:55<02:18, 46.10it/s][A
 68%|██████▊   | 13641/19999 [04:55<02:17, 46.10it/s][A
 68%|██████▊   | 13647/19999 [04:56<02:17, 46.10it/s][A
 68%|██████▊   | 13653/19999 [04:56<02:17, 46.10it/s][A
 68%|██████▊   | 13659/19999 [04:56<02:17, 46.10it/s][A
 68%|██████▊   | 13665/19999 [04:56<02:17, 46.10it/s][A
 68%|██████▊   | 13670/19999 [04:56<02:17, 46.10it/s][A
 68%|██████▊   | 13675/19999 [04:56<02:17, 46.10it/s][A
 68%|██████▊   | 13680/19999 [04:56<02:17, 46.09it/s][A
 68%|██████▊   | 13685/19999 [0

 72%|███████▏  | 14361/19999 [05:11<02:02, 46.05it/s][A
 72%|███████▏  | 14367/19999 [05:11<02:02, 46.06it/s][A
 72%|███████▏  | 14373/19999 [05:12<02:02, 46.06it/s][A
 72%|███████▏  | 14379/19999 [05:12<02:02, 46.06it/s][A
 72%|███████▏  | 14385/19999 [05:12<02:01, 46.06it/s][A
 72%|███████▏  | 14391/19999 [05:12<02:01, 46.06it/s][A
 72%|███████▏  | 14397/19999 [05:12<02:01, 46.06it/s][A
 72%|███████▏  | 14403/19999 [05:12<02:01, 46.07it/s][A
 72%|███████▏  | 14409/19999 [05:12<02:01, 46.06it/s][A
 72%|███████▏  | 14414/19999 [05:12<02:01, 46.06it/s][A
 72%|███████▏  | 14419/19999 [05:13<02:01, 46.06it/s][A
 72%|███████▏  | 14424/19999 [05:13<02:01, 46.06it/s][A
 72%|███████▏  | 14429/19999 [05:13<02:00, 46.06it/s][A
 72%|███████▏  | 14434/19999 [05:13<02:00, 46.05it/s][A
 72%|███████▏  | 14439/19999 [05:13<02:00, 46.05it/s][A
 72%|███████▏  | 14444/19999 [05:13<02:00, 46.05it/s][A
 72%|███████▏  | 14449/19999 [05:13<02:00, 46.05it/s][A
 72%|███████▏  | 14454/19999 [0

 76%|███████▌  | 15109/19999 [05:28<01:46, 45.93it/s][A
 76%|███████▌  | 15114/19999 [05:29<01:46, 45.93it/s][A
 76%|███████▌  | 15119/19999 [05:29<01:46, 45.92it/s][A
 76%|███████▌  | 15124/19999 [05:29<01:46, 45.92it/s][A
 76%|███████▌  | 15129/19999 [05:29<01:46, 45.92it/s][A
 76%|███████▌  | 15134/19999 [05:29<01:45, 45.92it/s][A
 76%|███████▌  | 15139/19999 [05:29<01:45, 45.92it/s][A
 76%|███████▌  | 15144/19999 [05:29<01:45, 45.92it/s][A
 76%|███████▌  | 15149/19999 [05:29<01:45, 45.91it/s][A
 76%|███████▌  | 15154/19999 [05:30<01:45, 45.91it/s][A
 76%|███████▌  | 15159/19999 [05:30<01:45, 45.91it/s][A
 76%|███████▌  | 15164/19999 [05:30<01:45, 45.91it/s][A
 76%|███████▌  | 15169/19999 [05:30<01:45, 45.91it/s][A
 76%|███████▌  | 15174/19999 [05:30<01:45, 45.90it/s][A
 76%|███████▌  | 15179/19999 [05:30<01:45, 45.90it/s][A
 76%|███████▌  | 15185/19999 [05:30<01:44, 45.90it/s][A
 76%|███████▌  | 15191/19999 [05:30<01:44, 45.90it/s][A
 76%|███████▌  | 15197/19999 [0

 79%|███████▉  | 15864/19999 [05:45<01:30, 45.86it/s][A
 79%|███████▉  | 15870/19999 [05:46<01:30, 45.87it/s][A
 79%|███████▉  | 15876/19999 [05:46<01:29, 45.87it/s][A
 79%|███████▉  | 15882/19999 [05:46<01:29, 45.87it/s][A
 79%|███████▉  | 15888/19999 [05:46<01:29, 45.87it/s][A
 79%|███████▉  | 15894/19999 [05:46<01:29, 45.87it/s][A
 80%|███████▉  | 15900/19999 [05:46<01:29, 45.87it/s][A
 80%|███████▉  | 15906/19999 [05:46<01:29, 45.87it/s][A
 80%|███████▉  | 15912/19999 [05:46<01:29, 45.88it/s][A
 80%|███████▉  | 15918/19999 [05:46<01:28, 45.88it/s][A
 80%|███████▉  | 15924/19999 [05:47<01:28, 45.88it/s][A
 80%|███████▉  | 15930/19999 [05:47<01:28, 45.88it/s][A
 80%|███████▉  | 15936/19999 [05:47<01:28, 45.88it/s][A
 80%|███████▉  | 15942/19999 [05:47<01:28, 45.88it/s][A
 80%|███████▉  | 15947/19999 [05:47<01:28, 45.88it/s][A
 80%|███████▉  | 15952/19999 [05:47<01:28, 45.88it/s][A
 80%|███████▉  | 15958/19999 [05:47<01:28, 45.88it/s][A
 80%|███████▉  | 15964/19999 [0

 83%|████████▎ | 16646/19999 [06:02<01:13, 45.87it/s][A
 83%|████████▎ | 16652/19999 [06:03<01:12, 45.87it/s][A
 83%|████████▎ | 16658/19999 [06:03<01:12, 45.87it/s][A
 83%|████████▎ | 16664/19999 [06:03<01:12, 45.88it/s][A
 83%|████████▎ | 16670/19999 [06:03<01:12, 45.88it/s][A
 83%|████████▎ | 16676/19999 [06:03<01:12, 45.88it/s][A
 83%|████████▎ | 16682/19999 [06:03<01:12, 45.88it/s][A
 83%|████████▎ | 16688/19999 [06:03<01:12, 45.88it/s][A
 83%|████████▎ | 16694/19999 [06:03<01:12, 45.88it/s][A
 84%|████████▎ | 16700/19999 [06:03<01:11, 45.88it/s][A
 84%|████████▎ | 16706/19999 [06:04<01:11, 45.89it/s][A
 84%|████████▎ | 16712/19999 [06:04<01:11, 45.89it/s][A
 84%|████████▎ | 16718/19999 [06:04<01:11, 45.89it/s][A
 84%|████████▎ | 16723/19999 [06:04<01:11, 45.88it/s][A
 84%|████████▎ | 16728/19999 [06:04<01:11, 45.88it/s][A
 84%|████████▎ | 16733/19999 [06:04<01:11, 45.88it/s][A
 84%|████████▎ | 16738/19999 [06:04<01:11, 45.88it/s][A
 84%|████████▎ | 16743/19999 [0

 87%|████████▋ | 17440/19999 [06:20<00:55, 45.89it/s][A
 87%|████████▋ | 17445/19999 [06:20<00:55, 45.89it/s][A
 87%|████████▋ | 17450/19999 [06:20<00:55, 45.89it/s][A
 87%|████████▋ | 17455/19999 [06:20<00:55, 45.89it/s][A
 87%|████████▋ | 17460/19999 [06:20<00:55, 45.89it/s][A
 87%|████████▋ | 17465/19999 [06:20<00:55, 45.89it/s][A
 87%|████████▋ | 17470/19999 [06:20<00:55, 45.88it/s][A
 87%|████████▋ | 17475/19999 [06:20<00:55, 45.88it/s][A
 87%|████████▋ | 17480/19999 [06:20<00:54, 45.88it/s][A
 87%|████████▋ | 17485/19999 [06:21<00:54, 45.88it/s][A
 87%|████████▋ | 17490/19999 [06:21<00:54, 45.88it/s][A
 87%|████████▋ | 17496/19999 [06:21<00:54, 45.88it/s][A
 88%|████████▊ | 17502/19999 [06:21<00:54, 45.88it/s][A
 88%|████████▊ | 17508/19999 [06:21<00:54, 45.88it/s][A
 88%|████████▊ | 17514/19999 [06:21<00:54, 45.89it/s][A
 88%|████████▊ | 17519/19999 [06:21<00:54, 45.88it/s][A
 88%|████████▊ | 17524/19999 [06:21<00:53, 45.88it/s][A
 88%|████████▊ | 17530/19999 [0

 91%|█████████ | 18201/19999 [06:37<00:39, 45.84it/s][A
 91%|█████████ | 18206/19999 [06:37<00:39, 45.84it/s][A
 91%|█████████ | 18211/19999 [06:37<00:39, 45.84it/s][A
 91%|█████████ | 18217/19999 [06:37<00:38, 45.84it/s][A
 91%|█████████ | 18222/19999 [06:37<00:38, 45.84it/s][A
 91%|█████████ | 18227/19999 [06:37<00:38, 45.84it/s][A
 91%|█████████ | 18232/19999 [06:37<00:38, 45.84it/s][A
 91%|█████████ | 18237/19999 [06:37<00:38, 45.84it/s][A
 91%|█████████ | 18242/19999 [06:37<00:38, 45.84it/s][A
 91%|█████████ | 18247/19999 [06:38<00:38, 45.84it/s][A
 91%|█████████▏| 18252/19999 [06:38<00:38, 45.84it/s][A
 91%|█████████▏| 18257/19999 [06:38<00:38, 45.84it/s][A
 91%|█████████▏| 18263/19999 [06:38<00:37, 45.84it/s][A
 91%|█████████▏| 18268/19999 [06:38<00:37, 45.84it/s][A
 91%|█████████▏| 18273/19999 [06:38<00:37, 45.84it/s][A
 91%|█████████▏| 18279/19999 [06:38<00:37, 45.84it/s][A
 91%|█████████▏| 18284/19999 [06:38<00:37, 45.84it/s][A
 91%|█████████▏| 18289/19999 [0

 95%|█████████▍| 18944/19999 [06:53<00:23, 45.77it/s][A
 95%|█████████▍| 18950/19999 [06:54<00:22, 45.77it/s][A
 95%|█████████▍| 18955/19999 [06:54<00:22, 45.77it/s][A
 95%|█████████▍| 18960/19999 [06:54<00:22, 45.77it/s][A
 95%|█████████▍| 18965/19999 [06:54<00:22, 45.77it/s][A
 95%|█████████▍| 18970/19999 [06:54<00:22, 45.76it/s][A
 95%|█████████▍| 18975/19999 [06:54<00:22, 45.76it/s][A
 95%|█████████▍| 18980/19999 [06:54<00:22, 45.76it/s][A
 95%|█████████▍| 18985/19999 [06:54<00:22, 45.76it/s][A
 95%|█████████▍| 18990/19999 [06:55<00:22, 45.76it/s][A
 95%|█████████▍| 18995/19999 [06:55<00:21, 45.76it/s][A
 95%|█████████▌| 19000/19999 [06:55<00:21, 45.76it/s][A
 95%|█████████▌| 19005/19999 [06:55<00:21, 45.75it/s][A
 95%|█████████▌| 19010/19999 [06:55<00:21, 45.75it/s][A
 95%|█████████▌| 19015/19999 [06:55<00:21, 45.75it/s][A
 95%|█████████▌| 19020/19999 [06:55<00:21, 45.75it/s][A
 95%|█████████▌| 19025/19999 [06:55<00:21, 45.75it/s][A
 95%|█████████▌| 19030/19999 [0

 99%|█████████▊| 19727/19999 [07:10<00:05, 45.78it/s][A
 99%|█████████▊| 19732/19999 [07:11<00:05, 45.77it/s][A
 99%|█████████▊| 19737/19999 [07:11<00:05, 45.77it/s][A
 99%|█████████▊| 19742/19999 [07:11<00:05, 45.77it/s][A
 99%|█████████▊| 19747/19999 [07:11<00:05, 45.77it/s][A
 99%|█████████▉| 19752/19999 [07:11<00:05, 45.77it/s][A
 99%|█████████▉| 19757/19999 [07:11<00:05, 45.77it/s][A
 99%|█████████▉| 19762/19999 [07:11<00:05, 45.77it/s][A
 99%|█████████▉| 19767/19999 [07:11<00:05, 45.77it/s][A
 99%|█████████▉| 19772/19999 [07:12<00:04, 45.77it/s][A
 99%|█████████▉| 19778/19999 [07:12<00:04, 45.77it/s][A
 99%|█████████▉| 19784/19999 [07:12<00:04, 45.77it/s][A
 99%|█████████▉| 19790/19999 [07:12<00:04, 45.77it/s][A
 99%|█████████▉| 19796/19999 [07:12<00:04, 45.77it/s][A
 99%|█████████▉| 19802/19999 [07:12<00:04, 45.77it/s][A
 99%|█████████▉| 19808/19999 [07:12<00:04, 45.78it/s][A
 99%|█████████▉| 19814/19999 [07:12<00:04, 45.78it/s][A
 99%|█████████▉| 19820/19999 [0

In [68]:
np.mean(res), np.std(res)

(0.41633244453847357, 0.077514127213931847)

Here we try to test adding regularisation

In [29]:
import numpy as np
import torch as t
import torch.nn as nn

from torch import LongTensor as LT
from torch import FloatTensor as FT

 
class Bundler(nn.Module):

    def forward(self, data):
        raise NotImplementedError

    def forward_i(self, data):
        raise NotImplementedError

    def forward_o(self, data):
        raise NotImplementedError


class Word2Vec(Bundler):

    def __init__(self, vocab_size=20000, embedding_size=300, padding_idx=0, vector_3 = None):
        # this instantiate the parent class
        super(Word2Vec, self).__init__()
        self.vocab_size = vocab_size
        self.embedding_size = embedding_size
        # define embeddings for the target word matrix and the context word matrix
        self.ivectors = nn.Embedding(self.vocab_size, self.embedding_size, padding_idx=padding_idx)
        self.ovectors = nn.Embedding(self.vocab_size, self.embedding_size, padding_idx=padding_idx)
        #self.vector_3 = nn.Embedding(self.vocab_size, 1, padding_idx=None)
        # define parameters with initial weights: 0 for the padding and uniformly sampled weights for the vocab
        self.ivectors.weight = nn.Parameter(t.cat([t.zeros(1, self.embedding_size), FT(self.vocab_size - 1, self.embedding_size).uniform_(-0.5 / self.embedding_size, 0.5 / self.embedding_size)]))
        self.ovectors.weight = nn.Parameter(t.cat([t.zeros(1, self.embedding_size), FT(self.vocab_size - 1, self.embedding_size).uniform_(-0.5 / self.embedding_size, 0.5 / self.embedding_size)]))
        #self.vector_3.weight = FT(vector_3)
        # indicates that we do not exclude this as it is the main part of the graph - this should be treated as parameters
        self.ivectors.weight.requires_grad = True
        self.ovectors.weight.requires_grad = True
        #self.vector_3.weight.requires_grad = False

    def forward(self, data):
        return self.forward_i(data)

    def forward_i(self, data):
        if data is not None:
            v = LT(data)
            v = v.cuda() if self.ivectors.weight.is_cuda else v
            return self.ivectors(v)
        else:
            return(None)

    def forward_o(self, data):
        v = LT(data)
        v = v.cuda() if self.ovectors.weight.is_cuda else v
        return self.ovectors(v)

class SGNS(nn.Module):

    def __init__(self, embedding, vocab_size=20000, n_negs=20, weights=None, test_tensor = None, vector3 = None):
        super(SGNS, self).__init__()
        self.embedding = embedding
        self.vocab_size = vocab_size
        self.n_negs = n_negs
        self.weights = None
        self.vector3 = FT(vector3).cuda()
        self.vector3.requires_grad = False
        if weights is not None:
            wf = np.power(weights, 0.75)
            wf = wf / wf.sum()
            self.weights = FT(wf)

    def forward(self, iword, owords, rwords):
        batch_size = iword.size()[0]
        context_size = owords.size()[1]
        if self.weights is not None:
            nwords = t.multinomial(self.weights, batch_size * context_size * self.n_negs, replacement=True).view(batch_size, -1)
        else:
            nwords = FT(batch_size, context_size * self.n_negs).uniform_(0, self.vocab_size - 1).long()
        ivectors = self.embedding.forward_i(iword).unsqueeze(2)
        #print('ivectors', ivectors.shape)
        ovectors = self.embedding.forward_o(owords)
        #print('ovectors', ovectors.shape)
        nvectors = self.embedding.forward_o(nwords).neg()
        #print(rvectors.shape)
##-------------- this is the line we need to modify: add the euclidean distance as a regularisation term
##-------------- we will also consider the consine similarity
        oloss = t.bmm(ovectors, ivectors).squeeze().sigmoid().log().mean(1)
        #print(oloss.shape)
        nloss = t.bmm(nvectors, ivectors).squeeze().sigmoid().log().view(-1, context_size, self.n_negs).sum(2).mean(1)
        #print(t.bmm(nvectors, ivectors).squeeze().sigmoid().log().view(-1, context_size, self.n_negs).sum(2).mean(1).shape)
        #rloss = 3*((rvectors.squeeze() - self.vector3)**2).sum()
        if self.embedding.forward_i(rwords) is not None:
            MSE_loss_fn = nn.MSELoss(reduction='sum')
            rvectors = self.embedding.forward_i(rwords)
            rloss = MSE_loss_fn(rvectors.squeeze(), self.vector3)
            return(-(oloss + nloss).mean() + 10*rloss)
        else:
            return(-(oloss + nloss).mean())
        #print((-(oloss + nloss).mean()).shape)

In [30]:
emb_dim = 300
model_name = 'period0_1'

model_1 = Word2Vec(vocab_size=vocab_size, embedding_size=emb_dim)
modelpath = os.path.join(save_dir, '{}.pt'.format(model_name))

n_negs = 100

sgns_1 = SGNS(embedding=model_1, vocab_size=vocab_size, n_negs=n_negs, weights=weights, vector3=vector3)

In [31]:
sgns_1 = sgns_1.cuda()

In [32]:
optim_1 = Adam(sgns_1.parameters())
optimpath = os.path.join(save_dir, '{}.optim.pt'.format(model_name))
if os.path.isfile(optimpath) and conti:
    optim_1.load_state_dict(t.load(optimpath))

In [33]:
n_epoch = 10
mb = 1000

for epoch in range(1, n_epoch + 1):
    dataset = PermutedSubsampledCorpus(os.path.join(data_path, 'train.dat'), ws)
    dataloader = DataLoader(dataset, batch_size=mb, shuffle=True)
    total_batches = int(np.ceil(len(dataset) / mb))
    pbar = tqdm(dataloader)
    pbar.set_description("[Epoch {}]".format(epoch))
    for iword, owords in pbar:
        rwords = LT([3]) if 3 in iword else None
        loss = sgns_1(iword, owords, rwords)
        #grad = sgns_1(iword, owords, rwords)[1]
        optim_1.zero_grad()
        loss.backward()
        #print(grad)
        #print(list(model_1.parameters()))
        optim_1.step()
        pbar.set_postfix(loss=loss.item())

  1%|          | 206/19999 [00:20<32:05, 10.28it/s]
  0%|          | 0/716 [00:00<?, ?it/s][A
[Epoch 1]:   0%|          | 0/716 [00:00<?, ?it/s][A
[Epoch 1]:   0%|          | 0/716 [00:00<?, ?it/s, loss=85.8][A
[Epoch 1]:   0%|          | 1/716 [00:00<08:35,  1.39it/s, loss=85.8][A
[Epoch 1]:   0%|          | 1/716 [00:01<13:24,  1.13s/it, loss=85.5][A
[Epoch 1]:   0%|          | 2/716 [00:01<06:42,  1.78it/s, loss=85.5][A
[Epoch 1]:   0%|          | 2/716 [00:01<08:58,  1.33it/s, loss=85.1][A
[Epoch 1]:   0%|          | 3/716 [00:01<05:58,  1.99it/s, loss=85.1][A
[Epoch 1]:   0%|          | 3/716 [00:01<07:31,  1.58it/s, loss=84.8][A
[Epoch 1]:   1%|          | 4/716 [00:01<05:39,  2.10it/s, loss=84.8][A
[Epoch 1]:   1%|          | 4/716 [00:02<06:47,  1.75it/s, loss=84.4][A
[Epoch 1]:   1%|          | 5/716 [00:02<05:26,  2.18it/s, loss=84.4][A
[Epoch 1]:   1%|          | 5/716 [00:02<06:19,  1.87it/s, loss=84.1][A
[Epoch 1]:   1%|          | 6/716 [00:02<05:16,  2.24it/

[Epoch 1]:   8%|▊         | 55/716 [00:21<04:20,  2.54it/s, loss=65][A
[Epoch 1]:   8%|▊         | 55/716 [00:22<04:24,  2.50it/s, loss=64.2][A
[Epoch 1]:   8%|▊         | 56/716 [00:22<04:19,  2.54it/s, loss=64.2][A
[Epoch 1]:   8%|▊         | 56/716 [00:22<04:24,  2.50it/s, loss=63.4][A
[Epoch 1]:   8%|▊         | 57/716 [00:22<04:19,  2.54it/s, loss=63.4][A
[Epoch 1]:   8%|▊         | 57/716 [00:22<04:23,  2.50it/s, loss=63.3][A
[Epoch 1]:   8%|▊         | 58/716 [00:22<04:18,  2.54it/s, loss=63.3][A
[Epoch 1]:   8%|▊         | 58/716 [00:23<04:22,  2.50it/s, loss=62.4][A
[Epoch 1]:   8%|▊         | 59/716 [00:23<04:18,  2.54it/s, loss=62.4][A
[Epoch 1]:   8%|▊         | 59/716 [00:23<04:22,  2.50it/s, loss=62.1][A
[Epoch 1]:   8%|▊         | 60/716 [00:23<04:17,  2.55it/s, loss=62.1][A
[Epoch 1]:   8%|▊         | 60/716 [00:23<04:21,  2.50it/s, loss=61.8][A
[Epoch 1]:   9%|▊         | 61/716 [00:23<04:17,  2.55it/s, loss=61.8][A
[Epoch 1]:   9%|▊         | 61/716 [00:2

[Epoch 1]:  15%|█▌        | 110/716 [00:42<03:55,  2.57it/s, loss=36.6][A
[Epoch 1]:  15%|█▌        | 110/716 [00:43<03:57,  2.55it/s, loss=36.6][A
[Epoch 1]:  16%|█▌        | 111/716 [00:43<03:54,  2.57it/s, loss=36.6][A
[Epoch 1]:  16%|█▌        | 111/716 [00:43<03:57,  2.55it/s, loss=35.7][A
[Epoch 1]:  16%|█▌        | 112/716 [00:43<03:54,  2.58it/s, loss=35.7][A
[Epoch 1]:  16%|█▌        | 112/716 [00:43<03:56,  2.55it/s, loss=36.2][A
[Epoch 1]:  16%|█▌        | 113/716 [00:43<03:54,  2.58it/s, loss=36.2][A
[Epoch 1]:  16%|█▌        | 113/716 [00:44<03:56,  2.55it/s, loss=34.3][A
[Epoch 1]:  16%|█▌        | 114/716 [00:44<03:53,  2.58it/s, loss=34.3][A
[Epoch 1]:  16%|█▌        | 114/716 [00:44<03:55,  2.55it/s, loss=33.4][A
[Epoch 1]:  16%|█▌        | 115/716 [00:44<03:53,  2.58it/s, loss=33.4][A
[Epoch 1]:  16%|█▌        | 115/716 [00:45<03:55,  2.55it/s, loss=34]  [A
[Epoch 1]:  16%|█▌        | 116/716 [00:45<03:52,  2.58it/s, loss=34][A
[Epoch 1]:  16%|█▌        |

[Epoch 1]:  23%|██▎       | 164/716 [01:03<03:34,  2.57it/s, loss=23.8][A
[Epoch 1]:  23%|██▎       | 165/716 [01:03<03:32,  2.59it/s, loss=23.8][A
[Epoch 1]:  23%|██▎       | 165/716 [01:04<03:34,  2.57it/s, loss=23.6][A
[Epoch 1]:  23%|██▎       | 166/716 [01:04<03:32,  2.59it/s, loss=23.6][A
[Epoch 1]:  23%|██▎       | 166/716 [01:04<03:33,  2.57it/s, loss=23.4][A
[Epoch 1]:  23%|██▎       | 167/716 [01:04<03:32,  2.59it/s, loss=23.4][A
[Epoch 1]:  23%|██▎       | 167/716 [01:04<03:33,  2.57it/s, loss=24.3][A
[Epoch 1]:  23%|██▎       | 168/716 [01:04<03:31,  2.59it/s, loss=24.3][A
[Epoch 1]:  23%|██▎       | 168/716 [01:05<03:32,  2.57it/s, loss=23.8][A
[Epoch 1]:  24%|██▎       | 169/716 [01:05<03:31,  2.59it/s, loss=23.8][A
[Epoch 1]:  24%|██▎       | 169/716 [01:05<03:32,  2.57it/s, loss=23.2][A
[Epoch 1]:  24%|██▎       | 170/716 [01:05<03:30,  2.59it/s, loss=23.2][A
[Epoch 1]:  24%|██▎       | 170/716 [01:06<03:32,  2.57it/s, loss=21.7][A
[Epoch 1]:  24%|██▍      

[Epoch 1]:  31%|███       | 219/716 [01:24<03:11,  2.59it/s, loss=18.4][A
[Epoch 1]:  31%|███       | 219/716 [01:24<03:12,  2.58it/s, loss=18.6][A
[Epoch 1]:  31%|███       | 220/716 [01:24<03:11,  2.59it/s, loss=18.6][A
[Epoch 1]:  31%|███       | 220/716 [01:25<03:12,  2.58it/s, loss=18.7][A
[Epoch 1]:  31%|███       | 221/716 [01:25<03:10,  2.59it/s, loss=18.7][A
[Epoch 1]:  31%|███       | 221/716 [01:25<03:11,  2.58it/s, loss=19]  [A
[Epoch 1]:  31%|███       | 222/716 [01:25<03:10,  2.59it/s, loss=19][A
[Epoch 1]:  31%|███       | 222/716 [01:26<03:11,  2.58it/s, loss=18.6][A
[Epoch 1]:  31%|███       | 223/716 [01:26<03:10,  2.59it/s, loss=18.6][A
[Epoch 1]:  31%|███       | 223/716 [01:26<03:11,  2.58it/s, loss=18.8][A
[Epoch 1]:  31%|███▏      | 224/716 [01:26<03:09,  2.59it/s, loss=18.8][A
[Epoch 1]:  31%|███▏      | 224/716 [01:26<03:10,  2.58it/s, loss=17.9][A
[Epoch 1]:  31%|███▏      | 225/716 [01:26<03:09,  2.59it/s, loss=17.9][A
[Epoch 1]:  31%|███▏      |

[Epoch 1]:  38%|███▊      | 273/716 [01:45<02:51,  2.59it/s, loss=17.6][A
[Epoch 1]:  38%|███▊      | 274/716 [01:45<02:50,  2.59it/s, loss=17.6][A
[Epoch 1]:  38%|███▊      | 274/716 [01:45<02:50,  2.59it/s, loss=15.9][A
[Epoch 1]:  38%|███▊      | 275/716 [01:45<02:49,  2.59it/s, loss=15.9][A
[Epoch 1]:  38%|███▊      | 275/716 [01:46<02:50,  2.59it/s, loss=16.7][A
[Epoch 1]:  39%|███▊      | 276/716 [01:46<02:49,  2.59it/s, loss=16.7][A
[Epoch 1]:  39%|███▊      | 276/716 [01:46<02:50,  2.59it/s, loss=17.7][A
[Epoch 1]:  39%|███▊      | 277/716 [01:46<02:49,  2.59it/s, loss=17.7][A
[Epoch 1]:  39%|███▊      | 277/716 [01:47<02:49,  2.59it/s, loss=16.9][A
[Epoch 1]:  39%|███▉      | 278/716 [01:47<02:48,  2.59it/s, loss=16.9][A
[Epoch 1]:  39%|███▉      | 278/716 [01:47<02:49,  2.59it/s, loss=17.3][A
[Epoch 1]:  39%|███▉      | 279/716 [01:47<02:48,  2.59it/s, loss=17.3][A
[Epoch 1]:  39%|███▉      | 279/716 [01:47<02:49,  2.59it/s, loss=16.6][A
[Epoch 1]:  39%|███▉     

[Epoch 1]:  46%|████▌     | 328/716 [02:06<02:29,  2.60it/s, loss=15.8][A
[Epoch 1]:  46%|████▌     | 328/716 [02:06<02:29,  2.59it/s, loss=14.6][A
[Epoch 1]:  46%|████▌     | 329/716 [02:06<02:29,  2.60it/s, loss=14.6][A
[Epoch 1]:  46%|████▌     | 329/716 [02:07<02:29,  2.59it/s, loss=15.6][A
[Epoch 1]:  46%|████▌     | 330/716 [02:07<02:28,  2.60it/s, loss=15.6][A
[Epoch 1]:  46%|████▌     | 330/716 [02:07<02:29,  2.59it/s, loss=15]  [A
[Epoch 1]:  46%|████▌     | 331/716 [02:07<02:28,  2.60it/s, loss=15][A
[Epoch 1]:  46%|████▌     | 331/716 [02:07<02:28,  2.59it/s, loss=16][A
[Epoch 1]:  46%|████▋     | 332/716 [02:07<02:27,  2.60it/s, loss=16][A
[Epoch 1]:  46%|████▋     | 332/716 [02:08<02:28,  2.59it/s, loss=15.9][A
[Epoch 1]:  47%|████▋     | 333/716 [02:08<02:27,  2.60it/s, loss=15.9][A
[Epoch 1]:  47%|████▋     | 333/716 [02:08<02:27,  2.59it/s, loss=14.1][A
[Epoch 1]:  47%|████▋     | 334/716 [02:08<02:27,  2.60it/s, loss=14.1][A
[Epoch 1]:  47%|████▋     | 334

[Epoch 1]:  53%|█████▎    | 382/716 [02:27<02:08,  2.59it/s, loss=14.9][A
[Epoch 1]:  53%|█████▎    | 383/716 [02:27<02:08,  2.60it/s, loss=14.9][A
[Epoch 1]:  53%|█████▎    | 383/716 [02:27<02:08,  2.59it/s, loss=14.3][A
[Epoch 1]:  54%|█████▎    | 384/716 [02:27<02:07,  2.60it/s, loss=14.3][A
[Epoch 1]:  54%|█████▎    | 384/716 [02:28<02:08,  2.59it/s, loss=15.8][A
[Epoch 1]:  54%|█████▍    | 385/716 [02:28<02:07,  2.60it/s, loss=15.8][A
[Epoch 1]:  54%|█████▍    | 385/716 [02:28<02:07,  2.59it/s, loss=14.7][A
[Epoch 1]:  54%|█████▍    | 386/716 [02:28<02:06,  2.60it/s, loss=14.7][A
[Epoch 1]:  54%|█████▍    | 386/716 [02:28<02:07,  2.59it/s, loss=14.3][A
[Epoch 1]:  54%|█████▍    | 387/716 [02:28<02:06,  2.60it/s, loss=14.3][A
[Epoch 1]:  54%|█████▍    | 387/716 [02:29<02:06,  2.59it/s, loss=15]  [A
[Epoch 1]:  54%|█████▍    | 388/716 [02:29<02:06,  2.60it/s, loss=15][A
[Epoch 1]:  54%|█████▍    | 388/716 [02:29<02:06,  2.59it/s, loss=14.4][A
[Epoch 1]:  54%|█████▍    |

[Epoch 1]:  61%|██████    | 437/716 [02:47<01:47,  2.60it/s, loss=14][A
[Epoch 1]:  61%|██████    | 437/716 [02:48<01:47,  2.60it/s, loss=15.4][A
[Epoch 1]:  61%|██████    | 438/716 [02:48<01:46,  2.60it/s, loss=15.4][A
[Epoch 1]:  61%|██████    | 438/716 [02:48<01:47,  2.60it/s, loss=14.1][A
[Epoch 1]:  61%|██████▏   | 439/716 [02:48<01:46,  2.60it/s, loss=14.1][A
[Epoch 1]:  61%|██████▏   | 439/716 [02:49<01:46,  2.60it/s, loss=14.1][A
[Epoch 1]:  61%|██████▏   | 440/716 [02:49<01:46,  2.60it/s, loss=14.1][A
[Epoch 1]:  61%|██████▏   | 440/716 [02:49<01:46,  2.60it/s, loss=14.6][A
[Epoch 1]:  62%|██████▏   | 441/716 [02:49<01:45,  2.60it/s, loss=14.6][A
[Epoch 1]:  62%|██████▏   | 441/716 [02:49<01:45,  2.60it/s, loss=15.4][A
[Epoch 1]:  62%|██████▏   | 442/716 [02:49<01:45,  2.60it/s, loss=15.4][A
[Epoch 1]:  62%|██████▏   | 442/716 [02:50<01:45,  2.60it/s, loss=13.7][A
[Epoch 1]:  62%|██████▏   | 443/716 [02:50<01:44,  2.60it/s, loss=13.7][A
[Epoch 1]:  62%|██████▏   |

[Epoch 1]:  69%|██████▊   | 491/716 [03:08<01:26,  2.60it/s, loss=13.5][A
[Epoch 1]:  69%|██████▊   | 492/716 [03:08<01:25,  2.61it/s, loss=13.5][A
[Epoch 1]:  69%|██████▊   | 492/716 [03:09<01:26,  2.60it/s, loss=14.5][A
[Epoch 1]:  69%|██████▉   | 493/716 [03:09<01:25,  2.61it/s, loss=14.5][A
[Epoch 1]:  69%|██████▉   | 493/716 [03:09<01:25,  2.60it/s, loss=13.8][A
[Epoch 1]:  69%|██████▉   | 494/716 [03:09<01:25,  2.61it/s, loss=13.8][A
[Epoch 1]:  69%|██████▉   | 494/716 [03:09<01:25,  2.60it/s, loss=14.4][A
[Epoch 1]:  69%|██████▉   | 495/716 [03:09<01:24,  2.61it/s, loss=14.4][A
[Epoch 1]:  69%|██████▉   | 495/716 [03:10<01:24,  2.60it/s, loss=13.8][A
[Epoch 1]:  69%|██████▉   | 496/716 [03:10<01:24,  2.61it/s, loss=13.8][A
[Epoch 1]:  69%|██████▉   | 496/716 [03:10<01:24,  2.60it/s, loss=14.1][A
[Epoch 1]:  69%|██████▉   | 497/716 [03:10<01:24,  2.61it/s, loss=14.1][A
[Epoch 1]:  69%|██████▉   | 497/716 [03:11<01:24,  2.60it/s, loss=14.7][A
[Epoch 1]:  70%|██████▉  

[Epoch 1]:  76%|███████▋  | 546/716 [03:29<01:05,  2.61it/s, loss=14][A
[Epoch 1]:  76%|███████▋  | 546/716 [03:29<01:05,  2.60it/s, loss=13.7][A
[Epoch 1]:  76%|███████▋  | 547/716 [03:29<01:04,  2.61it/s, loss=13.7][A
[Epoch 1]:  76%|███████▋  | 547/716 [03:30<01:04,  2.60it/s, loss=13.2][A
[Epoch 1]:  77%|███████▋  | 548/716 [03:30<01:04,  2.61it/s, loss=13.2][A
[Epoch 1]:  77%|███████▋  | 548/716 [03:30<01:04,  2.60it/s, loss=13.8][A
[Epoch 1]:  77%|███████▋  | 549/716 [03:30<01:04,  2.61it/s, loss=13.8][A
[Epoch 1]:  77%|███████▋  | 549/716 [03:30<01:04,  2.60it/s, loss=14.3][A
[Epoch 1]:  77%|███████▋  | 550/716 [03:30<01:03,  2.61it/s, loss=14.3][A
[Epoch 1]:  77%|███████▋  | 550/716 [03:31<01:03,  2.60it/s, loss=15.3][A
[Epoch 1]:  77%|███████▋  | 551/716 [03:31<01:03,  2.61it/s, loss=15.3][A
[Epoch 1]:  77%|███████▋  | 551/716 [03:31<01:03,  2.60it/s, loss=14.8][A
[Epoch 1]:  77%|███████▋  | 552/716 [03:31<01:02,  2.61it/s, loss=14.8][A
[Epoch 1]:  77%|███████▋  |

[Epoch 1]:  84%|████████▍ | 600/716 [03:50<00:44,  2.61it/s, loss=13.2][A
[Epoch 1]:  84%|████████▍ | 601/716 [03:50<00:44,  2.61it/s, loss=13.2][A
[Epoch 1]:  84%|████████▍ | 601/716 [03:50<00:44,  2.61it/s, loss=13.9][A
[Epoch 1]:  84%|████████▍ | 602/716 [03:50<00:43,  2.61it/s, loss=13.9][A
[Epoch 1]:  84%|████████▍ | 602/716 [03:50<00:43,  2.61it/s, loss=15.4][A
[Epoch 1]:  84%|████████▍ | 603/716 [03:50<00:43,  2.61it/s, loss=15.4][A
[Epoch 1]:  84%|████████▍ | 603/716 [03:51<00:43,  2.61it/s, loss=14]  [A
[Epoch 1]:  84%|████████▍ | 604/716 [03:51<00:42,  2.61it/s, loss=14][A
[Epoch 1]:  84%|████████▍ | 604/716 [03:51<00:42,  2.61it/s, loss=13.5][A
[Epoch 1]:  84%|████████▍ | 605/716 [03:51<00:42,  2.61it/s, loss=13.5][A
[Epoch 1]:  84%|████████▍ | 605/716 [03:52<00:42,  2.61it/s, loss=14.3][A
[Epoch 1]:  85%|████████▍ | 606/716 [03:52<00:42,  2.61it/s, loss=14.3][A
[Epoch 1]:  85%|████████▍ | 606/716 [03:52<00:42,  2.61it/s, loss=14.1][A
[Epoch 1]:  85%|████████▍ |

[Epoch 1]:  91%|█████████▏| 655/716 [04:10<00:23,  2.61it/s, loss=14.2][A
[Epoch 1]:  91%|█████████▏| 655/716 [04:11<00:23,  2.61it/s, loss=13.8][A
[Epoch 1]:  92%|█████████▏| 656/716 [04:11<00:22,  2.61it/s, loss=13.8][A
[Epoch 1]:  92%|█████████▏| 656/716 [04:11<00:23,  2.61it/s, loss=12.9][A
[Epoch 1]:  92%|█████████▏| 657/716 [04:11<00:22,  2.61it/s, loss=12.9][A
[Epoch 1]:  92%|█████████▏| 657/716 [04:11<00:22,  2.61it/s, loss=15]  [A
[Epoch 1]:  92%|█████████▏| 658/716 [04:11<00:22,  2.61it/s, loss=15][A
[Epoch 1]:  92%|█████████▏| 658/716 [04:12<00:22,  2.61it/s, loss=13.6][A
[Epoch 1]:  92%|█████████▏| 659/716 [04:12<00:21,  2.61it/s, loss=13.6][A
[Epoch 1]:  92%|█████████▏| 659/716 [04:12<00:21,  2.61it/s, loss=13.8][A
[Epoch 1]:  92%|█████████▏| 660/716 [04:12<00:21,  2.61it/s, loss=13.8][A
[Epoch 1]:  92%|█████████▏| 660/716 [04:13<00:21,  2.61it/s, loss=13.7][A
[Epoch 1]:  92%|█████████▏| 661/716 [04:13<00:21,  2.61it/s, loss=13.7][A
[Epoch 1]:  92%|█████████▏|

[Epoch 1]:  99%|█████████▉| 709/716 [04:31<00:02,  2.61it/s, loss=13.6][A
[Epoch 1]:  99%|█████████▉| 710/716 [04:31<00:02,  2.61it/s, loss=13.6][A
[Epoch 1]:  99%|█████████▉| 710/716 [04:32<00:02,  2.61it/s, loss=12.5][A
[Epoch 1]:  99%|█████████▉| 711/716 [04:32<00:01,  2.61it/s, loss=12.5][A
[Epoch 1]:  99%|█████████▉| 711/716 [04:32<00:01,  2.61it/s, loss=13.4][A
[Epoch 1]:  99%|█████████▉| 712/716 [04:32<00:01,  2.61it/s, loss=13.4][A
[Epoch 1]:  99%|█████████▉| 712/716 [04:33<00:01,  2.61it/s, loss=14]  [A
[Epoch 1]: 100%|█████████▉| 713/716 [04:33<00:01,  2.61it/s, loss=14][A
[Epoch 1]: 100%|█████████▉| 713/716 [04:33<00:01,  2.61it/s, loss=13.7][A
[Epoch 1]: 100%|█████████▉| 714/716 [04:33<00:00,  2.61it/s, loss=13.7][A
[Epoch 1]: 100%|█████████▉| 714/716 [04:33<00:00,  2.61it/s, loss=13.8][A
[Epoch 1]: 100%|█████████▉| 715/716 [04:33<00:00,  2.61it/s, loss=13.8][A
[Epoch 1]: 100%|█████████▉| 715/716 [04:33<00:00,  2.61it/s, loss=14.3][A
[Epoch 1]: 100%|██████████|

[Epoch 2]:   7%|▋         | 48/716 [00:18<04:21,  2.55it/s, loss=13][A
[Epoch 2]:   7%|▋         | 48/716 [00:19<04:26,  2.50it/s, loss=14.1][A
[Epoch 2]:   7%|▋         | 49/716 [00:19<04:21,  2.55it/s, loss=14.1][A
[Epoch 2]:   7%|▋         | 49/716 [00:19<04:26,  2.50it/s, loss=12.8][A
[Epoch 2]:   7%|▋         | 50/716 [00:19<04:20,  2.55it/s, loss=12.8][A
[Epoch 2]:   7%|▋         | 50/716 [00:19<04:25,  2.51it/s, loss=14.1][A
[Epoch 2]:   7%|▋         | 51/716 [00:19<04:20,  2.56it/s, loss=14.1][A
[Epoch 2]:   7%|▋         | 51/716 [00:20<04:25,  2.51it/s, loss=14]  [A
[Epoch 2]:   7%|▋         | 52/716 [00:20<04:19,  2.56it/s, loss=14][A
[Epoch 2]:   7%|▋         | 52/716 [00:20<04:24,  2.51it/s, loss=12.4][A
[Epoch 2]:   7%|▋         | 53/716 [00:20<04:18,  2.56it/s, loss=12.4][A
[Epoch 2]:   7%|▋         | 53/716 [00:21<04:23,  2.51it/s, loss=15.5][A
[Epoch 2]:   8%|▊         | 54/716 [00:21<04:18,  2.56it/s, loss=15.5][A
[Epoch 2]:   8%|▊         | 54/716 [00:21<

[Epoch 2]:  14%|█▍        | 103/716 [00:39<03:57,  2.58it/s, loss=12.7][A
[Epoch 2]:  14%|█▍        | 103/716 [00:40<03:59,  2.56it/s, loss=13.3][A
[Epoch 2]:  15%|█▍        | 104/716 [00:40<03:57,  2.58it/s, loss=13.3][A
[Epoch 2]:  15%|█▍        | 104/716 [00:40<03:59,  2.56it/s, loss=13.7][A
[Epoch 2]:  15%|█▍        | 105/716 [00:40<03:56,  2.58it/s, loss=13.7][A
[Epoch 2]:  15%|█▍        | 105/716 [00:41<03:58,  2.56it/s, loss=13.6][A
[Epoch 2]:  15%|█▍        | 106/716 [00:41<03:56,  2.58it/s, loss=13.6][A
[Epoch 2]:  15%|█▍        | 106/716 [00:41<03:58,  2.56it/s, loss=13.5][A
[Epoch 2]:  15%|█▍        | 107/716 [00:41<03:55,  2.58it/s, loss=13.5][A
[Epoch 2]:  15%|█▍        | 107/716 [00:41<03:58,  2.56it/s, loss=13.4][A
[Epoch 2]:  15%|█▌        | 108/716 [00:41<03:55,  2.58it/s, loss=13.4][A
[Epoch 2]:  15%|█▌        | 108/716 [00:42<03:57,  2.56it/s, loss=13.4][A
[Epoch 2]:  15%|█▌        | 109/716 [00:42<03:55,  2.58it/s, loss=13.4][A
[Epoch 2]:  15%|█▌       

[Epoch 2]:  22%|██▏       | 157/716 [01:01<03:37,  2.57it/s, loss=14.6][A
[Epoch 2]:  22%|██▏       | 158/716 [01:01<03:35,  2.59it/s, loss=14.6][A
[Epoch 2]:  22%|██▏       | 158/716 [01:01<03:36,  2.57it/s, loss=14.6][A
[Epoch 2]:  22%|██▏       | 159/716 [01:01<03:35,  2.59it/s, loss=14.6][A
[Epoch 2]:  22%|██▏       | 159/716 [01:01<03:36,  2.57it/s, loss=13.8][A
[Epoch 2]:  22%|██▏       | 160/716 [01:01<03:34,  2.59it/s, loss=13.8][A
[Epoch 2]:  22%|██▏       | 160/716 [01:02<03:36,  2.57it/s, loss=14.9][A
[Epoch 2]:  22%|██▏       | 161/716 [01:02<03:34,  2.59it/s, loss=14.9][A
[Epoch 2]:  22%|██▏       | 161/716 [01:02<03:35,  2.57it/s, loss=12.5][A
[Epoch 2]:  23%|██▎       | 162/716 [01:02<03:33,  2.59it/s, loss=12.5][A
[Epoch 2]:  23%|██▎       | 162/716 [01:02<03:35,  2.57it/s, loss=14.3][A
[Epoch 2]:  23%|██▎       | 163/716 [01:02<03:33,  2.59it/s, loss=14.3][A
[Epoch 2]:  23%|██▎       | 163/716 [01:03<03:34,  2.57it/s, loss=14]  [A
[Epoch 2]:  23%|██▎      

[Epoch 2]:  30%|██▉       | 212/716 [01:21<03:14,  2.59it/s, loss=14.5][A
[Epoch 2]:  30%|██▉       | 212/716 [01:22<03:15,  2.58it/s, loss=14.2][A
[Epoch 2]:  30%|██▉       | 213/716 [01:22<03:13,  2.59it/s, loss=14.2][A
[Epoch 2]:  30%|██▉       | 213/716 [01:22<03:14,  2.58it/s, loss=13.5][A
[Epoch 2]:  30%|██▉       | 214/716 [01:22<03:13,  2.59it/s, loss=13.5][A
[Epoch 2]:  30%|██▉       | 214/716 [01:22<03:14,  2.58it/s, loss=14.2][A
[Epoch 2]:  30%|███       | 215/716 [01:22<03:13,  2.59it/s, loss=14.2][A
[Epoch 2]:  30%|███       | 215/716 [01:23<03:14,  2.58it/s, loss=12.9][A
[Epoch 2]:  30%|███       | 216/716 [01:23<03:12,  2.59it/s, loss=12.9][A
[Epoch 2]:  30%|███       | 216/716 [01:23<03:13,  2.58it/s, loss=12.7][A
[Epoch 2]:  30%|███       | 217/716 [01:23<03:12,  2.59it/s, loss=12.7][A
[Epoch 2]:  30%|███       | 217/716 [01:24<03:13,  2.58it/s, loss=14.8][A
[Epoch 2]:  30%|███       | 218/716 [01:24<03:12,  2.59it/s, loss=14.8][A
[Epoch 2]:  30%|███      

[Epoch 2]:  37%|███▋      | 266/716 [01:42<02:54,  2.59it/s, loss=13.8][A
[Epoch 2]:  37%|███▋      | 267/716 [01:42<02:53,  2.60it/s, loss=13.8][A
[Epoch 2]:  37%|███▋      | 267/716 [01:43<02:53,  2.59it/s, loss=12.8][A
[Epoch 2]:  37%|███▋      | 268/716 [01:43<02:52,  2.60it/s, loss=12.8][A
[Epoch 2]:  37%|███▋      | 268/716 [01:43<02:53,  2.59it/s, loss=13.4][A
[Epoch 2]:  38%|███▊      | 269/716 [01:43<02:52,  2.60it/s, loss=13.4][A
[Epoch 2]:  38%|███▊      | 269/716 [01:44<02:52,  2.59it/s, loss=13.3][A
[Epoch 2]:  38%|███▊      | 270/716 [01:44<02:51,  2.60it/s, loss=13.3][A
[Epoch 2]:  38%|███▊      | 270/716 [01:44<02:52,  2.59it/s, loss=15.5][A
[Epoch 2]:  38%|███▊      | 271/716 [01:44<02:51,  2.60it/s, loss=15.5][A
[Epoch 2]:  38%|███▊      | 271/716 [01:44<02:52,  2.59it/s, loss=13.9][A
[Epoch 2]:  38%|███▊      | 272/716 [01:44<02:51,  2.60it/s, loss=13.9][A
[Epoch 2]:  38%|███▊      | 272/716 [01:45<02:51,  2.59it/s, loss=13.6][A
[Epoch 2]:  38%|███▊     

[Epoch 2]:  45%|████▍     | 321/716 [02:03<02:32,  2.59it/s, loss=13.1][A
[Epoch 2]:  45%|████▍     | 321/716 [02:04<02:32,  2.59it/s, loss=13.8][A
[Epoch 2]:  45%|████▍     | 322/716 [02:04<02:31,  2.59it/s, loss=13.8][A
[Epoch 2]:  45%|████▍     | 322/716 [02:04<02:32,  2.59it/s, loss=14.4][A
[Epoch 2]:  45%|████▌     | 323/716 [02:04<02:31,  2.59it/s, loss=14.4][A
[Epoch 2]:  45%|████▌     | 323/716 [02:04<02:31,  2.59it/s, loss=13.9][A
[Epoch 2]:  45%|████▌     | 324/716 [02:04<02:31,  2.59it/s, loss=13.9][A
[Epoch 2]:  45%|████▌     | 324/716 [02:05<02:31,  2.59it/s, loss=14.8][A
[Epoch 2]:  45%|████▌     | 325/716 [02:05<02:30,  2.59it/s, loss=14.8][A
[Epoch 2]:  45%|████▌     | 325/716 [02:05<02:31,  2.59it/s, loss=13.5][A
[Epoch 2]:  46%|████▌     | 326/716 [02:05<02:30,  2.60it/s, loss=13.5][A
[Epoch 2]:  46%|████▌     | 326/716 [02:06<02:30,  2.59it/s, loss=13.2][A
[Epoch 2]:  46%|████▌     | 327/716 [02:06<02:29,  2.60it/s, loss=13.2][A
[Epoch 2]:  46%|████▌    

[Epoch 2]:  52%|█████▏    | 375/716 [02:24<02:11,  2.59it/s, loss=14.5][A
[Epoch 2]:  53%|█████▎    | 376/716 [02:24<02:10,  2.60it/s, loss=14.5][A
[Epoch 2]:  53%|█████▎    | 376/716 [02:25<02:11,  2.59it/s, loss=13.3][A
[Epoch 2]:  53%|█████▎    | 377/716 [02:25<02:10,  2.60it/s, loss=13.3][A
[Epoch 2]:  53%|█████▎    | 377/716 [02:25<02:10,  2.59it/s, loss=13.1][A
[Epoch 2]:  53%|█████▎    | 378/716 [02:25<02:10,  2.60it/s, loss=13.1][A
[Epoch 2]:  53%|█████▎    | 378/716 [02:25<02:10,  2.59it/s, loss=13.5][A
[Epoch 2]:  53%|█████▎    | 379/716 [02:25<02:09,  2.60it/s, loss=13.5][A
[Epoch 2]:  53%|█████▎    | 379/716 [02:26<02:10,  2.59it/s, loss=15.2][A
[Epoch 2]:  53%|█████▎    | 380/716 [02:26<02:09,  2.60it/s, loss=15.2][A
[Epoch 2]:  53%|█████▎    | 380/716 [02:26<02:09,  2.59it/s, loss=14.1][A
[Epoch 2]:  53%|█████▎    | 381/716 [02:26<02:08,  2.60it/s, loss=14.1][A
[Epoch 2]:  53%|█████▎    | 381/716 [02:27<02:09,  2.59it/s, loss=13.5][A
[Epoch 2]:  53%|█████▎   

[Epoch 2]:  60%|██████    | 430/716 [02:45<01:49,  2.60it/s, loss=14.2][A
[Epoch 2]:  60%|██████    | 430/716 [02:45<01:50,  2.60it/s, loss=13.8][A
[Epoch 2]:  60%|██████    | 431/716 [02:45<01:49,  2.60it/s, loss=13.8][A
[Epoch 2]:  60%|██████    | 431/716 [02:46<01:49,  2.60it/s, loss=12.9][A
[Epoch 2]:  60%|██████    | 432/716 [02:46<01:49,  2.60it/s, loss=12.9][A
[Epoch 2]:  60%|██████    | 432/716 [02:46<01:49,  2.60it/s, loss=14.1][A
[Epoch 2]:  60%|██████    | 433/716 [02:46<01:48,  2.60it/s, loss=14.1][A
[Epoch 2]:  60%|██████    | 433/716 [02:46<01:49,  2.60it/s, loss=14]  [A
[Epoch 2]:  61%|██████    | 434/716 [02:46<01:48,  2.60it/s, loss=14][A
[Epoch 2]:  61%|██████    | 434/716 [02:47<01:48,  2.60it/s, loss=12.8][A
[Epoch 2]:  61%|██████    | 435/716 [02:47<01:47,  2.60it/s, loss=12.8][A
[Epoch 2]:  61%|██████    | 435/716 [02:47<01:48,  2.60it/s, loss=14.1][A
[Epoch 2]:  61%|██████    | 436/716 [02:47<01:47,  2.60it/s, loss=14.1][A
[Epoch 2]:  61%|██████    |

[Epoch 2]:  68%|██████▊   | 484/716 [03:06<01:29,  2.60it/s, loss=14.9][A
[Epoch 2]:  68%|██████▊   | 485/716 [03:06<01:28,  2.60it/s, loss=14.9][A
[Epoch 2]:  68%|██████▊   | 485/716 [03:06<01:28,  2.60it/s, loss=14]  [A
[Epoch 2]:  68%|██████▊   | 486/716 [03:06<01:28,  2.60it/s, loss=14][A
[Epoch 2]:  68%|██████▊   | 486/716 [03:06<01:28,  2.60it/s, loss=13.3][A
[Epoch 2]:  68%|██████▊   | 487/716 [03:06<01:27,  2.60it/s, loss=13.3][A
[Epoch 2]:  68%|██████▊   | 487/716 [03:07<01:28,  2.60it/s, loss=13.1][A
[Epoch 2]:  68%|██████▊   | 488/716 [03:07<01:27,  2.60it/s, loss=13.1][A
[Epoch 2]:  68%|██████▊   | 488/716 [03:07<01:27,  2.60it/s, loss=13]  [A
[Epoch 2]:  68%|██████▊   | 489/716 [03:07<01:27,  2.61it/s, loss=13][A
[Epoch 2]:  68%|██████▊   | 489/716 [03:08<01:27,  2.60it/s, loss=14][A
[Epoch 2]:  68%|██████▊   | 490/716 [03:08<01:26,  2.61it/s, loss=14][A
[Epoch 2]:  68%|██████▊   | 490/716 [03:08<01:26,  2.60it/s, loss=13.8][A
[Epoch 2]:  69%|██████▊   | 491/7

[Epoch 2]:  75%|███████▌  | 539/716 [03:26<01:07,  2.60it/s, loss=14.3][A
[Epoch 2]:  75%|███████▌  | 539/716 [03:27<01:08,  2.60it/s, loss=12.9][A
[Epoch 2]:  75%|███████▌  | 540/716 [03:27<01:07,  2.60it/s, loss=12.9][A
[Epoch 2]:  75%|███████▌  | 540/716 [03:27<01:07,  2.60it/s, loss=13.4][A
[Epoch 2]:  76%|███████▌  | 541/716 [03:27<01:07,  2.60it/s, loss=13.4][A
[Epoch 2]:  76%|███████▌  | 541/716 [03:28<01:07,  2.60it/s, loss=14.5][A
[Epoch 2]:  76%|███████▌  | 542/716 [03:28<01:06,  2.60it/s, loss=14.5][A
[Epoch 2]:  76%|███████▌  | 542/716 [03:28<01:06,  2.60it/s, loss=15.3][A
[Epoch 2]:  76%|███████▌  | 543/716 [03:28<01:06,  2.60it/s, loss=15.3][A
[Epoch 2]:  76%|███████▌  | 543/716 [03:28<01:06,  2.60it/s, loss=13.4][A
[Epoch 2]:  76%|███████▌  | 544/716 [03:28<01:06,  2.60it/s, loss=13.4][A
[Epoch 2]:  76%|███████▌  | 544/716 [03:29<01:06,  2.60it/s, loss=13.4][A
[Epoch 2]:  76%|███████▌  | 545/716 [03:29<01:05,  2.60it/s, loss=13.4][A
[Epoch 2]:  76%|███████▌ 

[Epoch 2]:  83%|████████▎ | 593/716 [03:47<00:47,  2.60it/s, loss=13.3][A
[Epoch 2]:  83%|████████▎ | 594/716 [03:47<00:46,  2.61it/s, loss=13.3][A
[Epoch 2]:  83%|████████▎ | 594/716 [03:48<00:46,  2.60it/s, loss=13.7][A
[Epoch 2]:  83%|████████▎ | 595/716 [03:48<00:46,  2.61it/s, loss=13.7][A
[Epoch 2]:  83%|████████▎ | 595/716 [03:48<00:46,  2.60it/s, loss=13.8][A
[Epoch 2]:  83%|████████▎ | 596/716 [03:48<00:46,  2.61it/s, loss=13.8][A
[Epoch 2]:  83%|████████▎ | 596/716 [03:49<00:46,  2.60it/s, loss=15]  [A
[Epoch 2]:  83%|████████▎ | 597/716 [03:49<00:45,  2.61it/s, loss=15][A
[Epoch 2]:  83%|████████▎ | 597/716 [03:49<00:45,  2.60it/s, loss=13.6][A
[Epoch 2]:  84%|████████▎ | 598/716 [03:49<00:45,  2.61it/s, loss=13.6][A
[Epoch 2]:  84%|████████▎ | 598/716 [03:49<00:45,  2.60it/s, loss=14.2][A
[Epoch 2]:  84%|████████▎ | 599/716 [03:49<00:44,  2.61it/s, loss=14.2][A
[Epoch 2]:  84%|████████▎ | 599/716 [03:50<00:44,  2.60it/s, loss=13.6][A
[Epoch 2]:  84%|████████▍ |

[Epoch 2]:  91%|█████████ | 648/716 [04:08<00:26,  2.61it/s, loss=12.9][A
[Epoch 2]:  91%|█████████ | 648/716 [04:09<00:26,  2.60it/s, loss=12.7][A
[Epoch 2]:  91%|█████████ | 649/716 [04:09<00:25,  2.61it/s, loss=12.7][A
[Epoch 2]:  91%|█████████ | 649/716 [04:09<00:25,  2.60it/s, loss=12.8][A
[Epoch 2]:  91%|█████████ | 650/716 [04:09<00:25,  2.61it/s, loss=12.8][A
[Epoch 2]:  91%|█████████ | 650/716 [04:09<00:25,  2.60it/s, loss=14.2][A
[Epoch 2]:  91%|█████████ | 651/716 [04:09<00:24,  2.61it/s, loss=14.2][A
[Epoch 2]:  91%|█████████ | 651/716 [04:10<00:24,  2.60it/s, loss=13.6][A
[Epoch 2]:  91%|█████████ | 652/716 [04:10<00:24,  2.61it/s, loss=13.6][A
[Epoch 2]:  91%|█████████ | 652/716 [04:10<00:24,  2.60it/s, loss=14.1][A
[Epoch 2]:  91%|█████████ | 653/716 [04:10<00:24,  2.61it/s, loss=14.1][A
[Epoch 2]:  91%|█████████ | 653/716 [04:10<00:24,  2.60it/s, loss=13.5][A
[Epoch 2]:  91%|█████████▏| 654/716 [04:10<00:23,  2.61it/s, loss=13.5][A
[Epoch 2]:  91%|█████████

[Epoch 2]:  98%|█████████▊| 702/716 [04:29<00:05,  2.60it/s, loss=14][A
[Epoch 2]:  98%|█████████▊| 703/716 [04:29<00:04,  2.60it/s, loss=14][A
[Epoch 2]:  98%|█████████▊| 703/716 [04:30<00:04,  2.60it/s, loss=14.1][A
[Epoch 2]:  98%|█████████▊| 704/716 [04:30<00:04,  2.60it/s, loss=14.1][A
[Epoch 2]:  98%|█████████▊| 704/716 [04:30<00:04,  2.60it/s, loss=13.4][A
[Epoch 2]:  98%|█████████▊| 705/716 [04:30<00:04,  2.60it/s, loss=13.4][A
[Epoch 2]:  98%|█████████▊| 705/716 [04:31<00:04,  2.60it/s, loss=13.9][A
[Epoch 2]:  99%|█████████▊| 706/716 [04:31<00:03,  2.60it/s, loss=13.9][A
[Epoch 2]:  99%|█████████▊| 706/716 [04:31<00:03,  2.60it/s, loss=13.5][A
[Epoch 2]:  99%|█████████▊| 707/716 [04:31<00:03,  2.60it/s, loss=13.5][A
[Epoch 2]:  99%|█████████▊| 707/716 [04:31<00:03,  2.60it/s, loss=15.3][A
[Epoch 2]:  99%|█████████▉| 708/716 [04:31<00:03,  2.60it/s, loss=15.3][A
[Epoch 2]:  99%|█████████▉| 708/716 [04:32<00:03,  2.60it/s, loss=14.2][A
[Epoch 2]:  99%|█████████▉| 7

[Epoch 3]:   6%|▌         | 41/714 [00:15<04:22,  2.56it/s, loss=13.9][A
[Epoch 3]:   6%|▌         | 41/714 [00:16<04:28,  2.50it/s, loss=13.1][A
[Epoch 3]:   6%|▌         | 42/714 [00:16<04:21,  2.57it/s, loss=13.1][A
[Epoch 3]:   6%|▌         | 42/714 [00:16<04:28,  2.51it/s, loss=13.7][A
[Epoch 3]:   6%|▌         | 43/714 [00:16<04:21,  2.57it/s, loss=13.7][A
[Epoch 3]:   6%|▌         | 43/714 [00:17<04:27,  2.51it/s, loss=14.1][A
[Epoch 3]:   6%|▌         | 44/714 [00:17<04:20,  2.57it/s, loss=14.1][A
[Epoch 3]:   6%|▌         | 44/714 [00:17<04:26,  2.51it/s, loss=13.8][A
[Epoch 3]:   6%|▋         | 45/714 [00:17<04:20,  2.57it/s, loss=13.8][A
[Epoch 3]:   6%|▋         | 45/714 [00:17<04:26,  2.51it/s, loss=13.4][A
[Epoch 3]:   6%|▋         | 46/714 [00:17<04:20,  2.57it/s, loss=13.4][A
[Epoch 3]:   6%|▋         | 46/714 [00:18<04:25,  2.52it/s, loss=13.1][A
[Epoch 3]:   7%|▋         | 47/714 [00:18<04:19,  2.57it/s, loss=13.1][A
[Epoch 3]:   7%|▋         | 47/714 [00

[Epoch 3]:  13%|█▎        | 96/714 [00:37<03:59,  2.59it/s, loss=14.5][A
[Epoch 3]:  13%|█▎        | 96/714 [00:37<04:01,  2.56it/s, loss=13.9][A
[Epoch 3]:  14%|█▎        | 97/714 [00:37<03:58,  2.59it/s, loss=13.9][A
[Epoch 3]:  14%|█▎        | 97/714 [00:37<04:01,  2.56it/s, loss=13.7][A
[Epoch 3]:  14%|█▎        | 98/714 [00:37<03:58,  2.59it/s, loss=13.7][A
[Epoch 3]:  14%|█▎        | 98/714 [00:38<04:00,  2.56it/s, loss=14.1][A
[Epoch 3]:  14%|█▍        | 99/714 [00:38<03:57,  2.59it/s, loss=14.1][A
[Epoch 3]:  14%|█▍        | 99/714 [00:38<04:00,  2.56it/s, loss=15]  [A
[Epoch 3]:  14%|█▍        | 100/714 [00:38<03:57,  2.59it/s, loss=15][A
[Epoch 3]:  14%|█▍        | 100/714 [00:39<03:59,  2.56it/s, loss=13.1][A
[Epoch 3]:  14%|█▍        | 101/714 [00:39<03:56,  2.59it/s, loss=13.1][A
[Epoch 3]:  14%|█▍        | 101/714 [00:39<03:59,  2.56it/s, loss=14.3][A
[Epoch 3]:  14%|█▍        | 102/714 [00:39<03:56,  2.59it/s, loss=14.3][A
[Epoch 3]:  14%|█▍        | 102/714

[Epoch 3]:  21%|██        | 150/714 [00:58<03:38,  2.58it/s, loss=13.1][A
[Epoch 3]:  21%|██        | 151/714 [00:58<03:36,  2.60it/s, loss=13.1][A
[Epoch 3]:  21%|██        | 151/714 [00:58<03:37,  2.59it/s, loss=15.1][A
[Epoch 3]:  21%|██▏       | 152/714 [00:58<03:35,  2.60it/s, loss=15.1][A
[Epoch 3]:  21%|██▏       | 152/714 [00:58<03:37,  2.58it/s, loss=13.6][A
[Epoch 3]:  21%|██▏       | 153/714 [00:58<03:35,  2.60it/s, loss=13.6][A
[Epoch 3]:  21%|██▏       | 153/714 [00:59<03:36,  2.59it/s, loss=13.7][A
[Epoch 3]:  22%|██▏       | 154/714 [00:59<03:35,  2.60it/s, loss=13.7][A
[Epoch 3]:  22%|██▏       | 154/714 [00:59<03:36,  2.59it/s, loss=13.3][A
[Epoch 3]:  22%|██▏       | 155/714 [00:59<03:34,  2.60it/s, loss=13.3][A
[Epoch 3]:  22%|██▏       | 155/714 [00:59<03:36,  2.59it/s, loss=12.7][A
[Epoch 3]:  22%|██▏       | 156/714 [00:59<03:34,  2.60it/s, loss=12.7][A
[Epoch 3]:  22%|██▏       | 156/714 [01:00<03:35,  2.59it/s, loss=13.3][A
[Epoch 3]:  22%|██▏      

[Epoch 3]:  29%|██▊       | 205/714 [01:18<03:15,  2.61it/s, loss=13.1][A
[Epoch 3]:  29%|██▊       | 205/714 [01:19<03:16,  2.59it/s, loss=13.9][A
[Epoch 3]:  29%|██▉       | 206/714 [01:19<03:14,  2.61it/s, loss=13.9][A
[Epoch 3]:  29%|██▉       | 206/714 [01:19<03:15,  2.59it/s, loss=12.9][A
[Epoch 3]:  29%|██▉       | 207/714 [01:19<03:14,  2.61it/s, loss=12.9][A
[Epoch 3]:  29%|██▉       | 207/714 [01:19<03:15,  2.59it/s, loss=13.5][A
[Epoch 3]:  29%|██▉       | 208/714 [01:19<03:14,  2.60it/s, loss=13.5][A
[Epoch 3]:  29%|██▉       | 208/714 [01:20<03:15,  2.59it/s, loss=13]  [A
[Epoch 3]:  29%|██▉       | 209/714 [01:20<03:13,  2.60it/s, loss=13][A
[Epoch 3]:  29%|██▉       | 209/714 [01:20<03:14,  2.59it/s, loss=12.9][A
[Epoch 3]:  29%|██▉       | 210/714 [01:20<03:13,  2.60it/s, loss=12.9][A
[Epoch 3]:  29%|██▉       | 210/714 [01:21<03:14,  2.59it/s, loss=13.7][A
[Epoch 3]:  30%|██▉       | 211/714 [01:21<03:13,  2.60it/s, loss=13.7][A
[Epoch 3]:  30%|██▉       |

[Epoch 3]:  36%|███▋      | 259/714 [01:39<02:55,  2.60it/s, loss=12.3][A
[Epoch 3]:  36%|███▋      | 260/714 [01:39<02:54,  2.61it/s, loss=12.3][A
[Epoch 3]:  36%|███▋      | 260/714 [01:40<02:54,  2.60it/s, loss=14]  [A
[Epoch 3]:  37%|███▋      | 261/714 [01:40<02:53,  2.61it/s, loss=14][A
[Epoch 3]:  37%|███▋      | 261/714 [01:40<02:54,  2.60it/s, loss=14.1][A
[Epoch 3]:  37%|███▋      | 262/714 [01:40<02:53,  2.61it/s, loss=14.1][A
[Epoch 3]:  37%|███▋      | 262/714 [01:40<02:54,  2.60it/s, loss=13.4][A
[Epoch 3]:  37%|███▋      | 263/714 [01:40<02:53,  2.61it/s, loss=13.4][A
[Epoch 3]:  37%|███▋      | 263/714 [01:41<02:53,  2.60it/s, loss=12.9][A
[Epoch 3]:  37%|███▋      | 264/714 [01:41<02:52,  2.61it/s, loss=12.9][A
[Epoch 3]:  37%|███▋      | 264/714 [01:41<02:53,  2.60it/s, loss=11.9][A
[Epoch 3]:  37%|███▋      | 265/714 [01:41<02:52,  2.61it/s, loss=11.9][A
[Epoch 3]:  37%|███▋      | 265/714 [01:42<02:52,  2.60it/s, loss=13.2][A
[Epoch 3]:  37%|███▋      |

[Epoch 3]:  44%|████▍     | 314/714 [02:00<02:33,  2.60it/s, loss=13.8][A
[Epoch 3]:  44%|████▍     | 314/714 [02:00<02:34,  2.60it/s, loss=14.3][A
[Epoch 3]:  44%|████▍     | 315/714 [02:00<02:33,  2.60it/s, loss=14.3][A
[Epoch 3]:  44%|████▍     | 315/714 [02:01<02:33,  2.60it/s, loss=13.5][A
[Epoch 3]:  44%|████▍     | 316/714 [02:01<02:32,  2.60it/s, loss=13.5][A
[Epoch 3]:  44%|████▍     | 316/714 [02:01<02:33,  2.60it/s, loss=14.5][A
[Epoch 3]:  44%|████▍     | 317/714 [02:01<02:32,  2.60it/s, loss=14.5][A
[Epoch 3]:  44%|████▍     | 317/714 [02:02<02:32,  2.60it/s, loss=13.1][A
[Epoch 3]:  45%|████▍     | 318/714 [02:02<02:32,  2.60it/s, loss=13.1][A
[Epoch 3]:  45%|████▍     | 318/714 [02:02<02:32,  2.60it/s, loss=14.3][A
[Epoch 3]:  45%|████▍     | 319/714 [02:02<02:31,  2.60it/s, loss=14.3][A
[Epoch 3]:  45%|████▍     | 319/714 [02:02<02:32,  2.60it/s, loss=12.6][A
[Epoch 3]:  45%|████▍     | 320/714 [02:02<02:31,  2.60it/s, loss=12.6][A
[Epoch 3]:  45%|████▍    

[Epoch 3]:  52%|█████▏    | 368/714 [02:21<02:13,  2.60it/s, loss=12.6][A
[Epoch 3]:  52%|█████▏    | 369/714 [02:21<02:12,  2.60it/s, loss=12.6][A
[Epoch 3]:  52%|█████▏    | 369/714 [02:22<02:12,  2.60it/s, loss=13.9][A
[Epoch 3]:  52%|█████▏    | 370/714 [02:22<02:12,  2.60it/s, loss=13.9][A
[Epoch 3]:  52%|█████▏    | 370/714 [02:22<02:12,  2.60it/s, loss=12.7][A
[Epoch 3]:  52%|█████▏    | 371/714 [02:22<02:11,  2.60it/s, loss=12.7][A
[Epoch 3]:  52%|█████▏    | 371/714 [02:22<02:12,  2.60it/s, loss=14.6][A
[Epoch 3]:  52%|█████▏    | 372/714 [02:22<02:11,  2.60it/s, loss=14.6][A
[Epoch 3]:  52%|█████▏    | 372/714 [02:23<02:11,  2.60it/s, loss=14.9][A
[Epoch 3]:  52%|█████▏    | 373/714 [02:23<02:10,  2.60it/s, loss=14.9][A
[Epoch 3]:  52%|█████▏    | 373/714 [02:23<02:11,  2.60it/s, loss=13.5][A
[Epoch 3]:  52%|█████▏    | 374/714 [02:23<02:10,  2.60it/s, loss=13.5][A
[Epoch 3]:  52%|█████▏    | 374/714 [02:24<02:10,  2.60it/s, loss=13.7][A
[Epoch 3]:  53%|█████▎   

[Epoch 3]:  59%|█████▉    | 423/714 [02:42<01:51,  2.61it/s, loss=14.9][A
[Epoch 3]:  59%|█████▉    | 423/714 [02:42<01:51,  2.60it/s, loss=14.3][A
[Epoch 3]:  59%|█████▉    | 424/714 [02:42<01:51,  2.61it/s, loss=14.3][A
[Epoch 3]:  59%|█████▉    | 424/714 [02:43<01:51,  2.60it/s, loss=12.7][A
[Epoch 3]:  60%|█████▉    | 425/714 [02:43<01:50,  2.61it/s, loss=12.7][A
[Epoch 3]:  60%|█████▉    | 425/714 [02:43<01:51,  2.60it/s, loss=12.9][A
[Epoch 3]:  60%|█████▉    | 426/714 [02:43<01:50,  2.61it/s, loss=12.9][A
[Epoch 3]:  60%|█████▉    | 426/714 [02:43<01:50,  2.60it/s, loss=13.4][A
[Epoch 3]:  60%|█████▉    | 427/714 [02:43<01:50,  2.61it/s, loss=13.4][A
[Epoch 3]:  60%|█████▉    | 427/714 [02:44<01:50,  2.60it/s, loss=13.3][A
[Epoch 3]:  60%|█████▉    | 428/714 [02:44<01:49,  2.61it/s, loss=13.3][A
[Epoch 3]:  60%|█████▉    | 428/714 [02:44<01:50,  2.60it/s, loss=13.6][A
[Epoch 3]:  60%|██████    | 429/714 [02:44<01:49,  2.61it/s, loss=13.6][A
[Epoch 3]:  60%|██████   

[Epoch 3]:  67%|██████▋   | 477/714 [03:03<01:31,  2.60it/s, loss=13.8][A
[Epoch 3]:  67%|██████▋   | 478/714 [03:03<01:30,  2.61it/s, loss=13.8][A
[Epoch 3]:  67%|██████▋   | 478/714 [03:03<01:30,  2.60it/s, loss=13.5][A
[Epoch 3]:  67%|██████▋   | 479/714 [03:03<01:30,  2.61it/s, loss=13.5][A
[Epoch 3]:  67%|██████▋   | 479/714 [03:04<01:30,  2.60it/s, loss=13.7][A
[Epoch 3]:  67%|██████▋   | 480/714 [03:04<01:29,  2.61it/s, loss=13.7][A
[Epoch 3]:  67%|██████▋   | 480/714 [03:04<01:29,  2.60it/s, loss=14.2][A
[Epoch 3]:  67%|██████▋   | 481/714 [03:04<01:29,  2.61it/s, loss=14.2][A
[Epoch 3]:  67%|██████▋   | 481/714 [03:04<01:29,  2.60it/s, loss=13.7][A
[Epoch 3]:  68%|██████▊   | 482/714 [03:04<01:29,  2.61it/s, loss=13.7][A
[Epoch 3]:  68%|██████▊   | 482/714 [03:05<01:29,  2.60it/s, loss=14.1][A
[Epoch 3]:  68%|██████▊   | 483/714 [03:05<01:28,  2.61it/s, loss=14.1][A
[Epoch 3]:  68%|██████▊   | 483/714 [03:05<01:28,  2.60it/s, loss=14.1][A
[Epoch 3]:  68%|██████▊  

[Epoch 3]:  75%|███████▍  | 532/714 [03:24<01:09,  2.61it/s, loss=13.7][A
[Epoch 3]:  75%|███████▍  | 532/714 [03:24<01:09,  2.60it/s, loss=14]  [A
[Epoch 3]:  75%|███████▍  | 533/714 [03:24<01:09,  2.61it/s, loss=14][A
[Epoch 3]:  75%|███████▍  | 533/714 [03:24<01:09,  2.60it/s, loss=13.4][A
[Epoch 3]:  75%|███████▍  | 534/714 [03:24<01:09,  2.61it/s, loss=13.4][A
[Epoch 3]:  75%|███████▍  | 534/714 [03:25<01:09,  2.60it/s, loss=14.2][A
[Epoch 3]:  75%|███████▍  | 535/714 [03:25<01:08,  2.61it/s, loss=14.2][A
[Epoch 3]:  75%|███████▍  | 535/714 [03:25<01:08,  2.60it/s, loss=12.6][A
[Epoch 3]:  75%|███████▌  | 536/714 [03:25<01:08,  2.61it/s, loss=12.6][A
[Epoch 3]:  75%|███████▌  | 536/714 [03:25<01:08,  2.60it/s, loss=12.6][A
[Epoch 3]:  75%|███████▌  | 537/714 [03:25<01:07,  2.61it/s, loss=12.6][A
[Epoch 3]:  75%|███████▌  | 537/714 [03:26<01:07,  2.60it/s, loss=13]  [A
[Epoch 3]:  75%|███████▌  | 538/714 [03:26<01:07,  2.61it/s, loss=13][A
[Epoch 3]:  75%|███████▌  | 5

[Epoch 3]:  82%|████████▏ | 586/714 [03:45<00:49,  2.60it/s, loss=13.3][A
[Epoch 3]:  82%|████████▏ | 587/714 [03:45<00:48,  2.61it/s, loss=13.3][A
[Epoch 3]:  82%|████████▏ | 587/714 [03:45<00:48,  2.60it/s, loss=13.7][A
[Epoch 3]:  82%|████████▏ | 588/714 [03:45<00:48,  2.61it/s, loss=13.7][A
[Epoch 3]:  82%|████████▏ | 588/714 [03:45<00:48,  2.60it/s, loss=11.9][A
[Epoch 3]:  82%|████████▏ | 589/714 [03:45<00:47,  2.61it/s, loss=11.9][A
[Epoch 3]:  82%|████████▏ | 589/714 [03:46<00:48,  2.60it/s, loss=13.9][A
[Epoch 3]:  83%|████████▎ | 590/714 [03:46<00:47,  2.61it/s, loss=13.9][A
[Epoch 3]:  83%|████████▎ | 590/714 [03:46<00:47,  2.60it/s, loss=13.2][A
[Epoch 3]:  83%|████████▎ | 591/714 [03:46<00:47,  2.61it/s, loss=13.2][A
[Epoch 3]:  83%|████████▎ | 591/714 [03:47<00:47,  2.60it/s, loss=14.4][A
[Epoch 3]:  83%|████████▎ | 592/714 [03:47<00:46,  2.61it/s, loss=14.4][A
[Epoch 3]:  83%|████████▎ | 592/714 [03:47<00:46,  2.60it/s, loss=15]  [A
[Epoch 3]:  83%|████████▎

[Epoch 3]:  90%|████████▉ | 641/714 [04:05<00:28,  2.61it/s, loss=13.9][A
[Epoch 3]:  90%|████████▉ | 641/714 [04:06<00:28,  2.60it/s, loss=14.1][A
[Epoch 3]:  90%|████████▉ | 642/714 [04:06<00:27,  2.61it/s, loss=14.1][A
[Epoch 3]:  90%|████████▉ | 642/714 [04:06<00:27,  2.60it/s, loss=13]  [A
[Epoch 3]:  90%|█████████ | 643/714 [04:06<00:27,  2.61it/s, loss=13][A
[Epoch 3]:  90%|█████████ | 643/714 [04:07<00:27,  2.60it/s, loss=13.6][A
[Epoch 3]:  90%|█████████ | 644/714 [04:07<00:26,  2.61it/s, loss=13.6][A
[Epoch 3]:  90%|█████████ | 644/714 [04:07<00:26,  2.60it/s, loss=13.5][A
[Epoch 3]:  90%|█████████ | 645/714 [04:07<00:26,  2.61it/s, loss=13.5][A
[Epoch 3]:  90%|█████████ | 645/714 [04:07<00:26,  2.60it/s, loss=14]  [A
[Epoch 3]:  90%|█████████ | 646/714 [04:07<00:26,  2.61it/s, loss=14][A
[Epoch 3]:  90%|█████████ | 646/714 [04:08<00:26,  2.60it/s, loss=13.5][A
[Epoch 3]:  91%|█████████ | 647/714 [04:08<00:25,  2.61it/s, loss=13.5][A
[Epoch 3]:  91%|█████████ | 6

[Epoch 3]:  97%|█████████▋| 695/714 [04:26<00:07,  2.60it/s, loss=14.8][A
[Epoch 3]:  97%|█████████▋| 696/714 [04:26<00:06,  2.61it/s, loss=14.8][A
[Epoch 3]:  97%|█████████▋| 696/714 [04:27<00:06,  2.60it/s, loss=13.8][A
[Epoch 3]:  98%|█████████▊| 697/714 [04:27<00:06,  2.61it/s, loss=13.8][A
[Epoch 3]:  98%|█████████▊| 697/714 [04:27<00:06,  2.60it/s, loss=12.7][A
[Epoch 3]:  98%|█████████▊| 698/714 [04:27<00:06,  2.61it/s, loss=12.7][A
[Epoch 3]:  98%|█████████▊| 698/714 [04:27<00:06,  2.61it/s, loss=13.3][A
[Epoch 3]:  98%|█████████▊| 699/714 [04:27<00:05,  2.61it/s, loss=13.3][A
[Epoch 3]:  98%|█████████▊| 699/714 [04:28<00:05,  2.61it/s, loss=14.4][A
[Epoch 3]:  98%|█████████▊| 700/714 [04:28<00:05,  2.61it/s, loss=14.4][A
[Epoch 3]:  98%|█████████▊| 700/714 [04:28<00:05,  2.61it/s, loss=13.9][A
[Epoch 3]:  98%|█████████▊| 701/714 [04:28<00:04,  2.61it/s, loss=13.9][A
[Epoch 3]:  98%|█████████▊| 701/714 [04:29<00:04,  2.60it/s, loss=13.4][A
[Epoch 3]:  98%|█████████

[Epoch 4]:   5%|▌         | 36/716 [00:14<04:28,  2.54it/s, loss=14.1][A
[Epoch 4]:   5%|▌         | 36/716 [00:14<04:35,  2.47it/s, loss=13.6][A
[Epoch 4]:   5%|▌         | 37/716 [00:14<04:27,  2.54it/s, loss=13.6][A
[Epoch 4]:   5%|▌         | 37/716 [00:14<04:34,  2.48it/s, loss=13.3][A
[Epoch 4]:   5%|▌         | 38/716 [00:14<04:26,  2.54it/s, loss=13.3][A
[Epoch 4]:   5%|▌         | 38/716 [00:15<04:33,  2.48it/s, loss=12.3][A
[Epoch 4]:   5%|▌         | 39/716 [00:15<04:26,  2.54it/s, loss=12.3][A
[Epoch 4]:   5%|▌         | 39/716 [00:15<04:32,  2.48it/s, loss=12.8][A
[Epoch 4]:   6%|▌         | 40/716 [00:15<04:25,  2.55it/s, loss=12.8][A
[Epoch 4]:   6%|▌         | 40/716 [00:16<04:31,  2.49it/s, loss=14]  [A
[Epoch 4]:   6%|▌         | 41/716 [00:16<04:24,  2.55it/s, loss=14][A
[Epoch 4]:   6%|▌         | 41/716 [00:16<04:31,  2.49it/s, loss=13.8][A
[Epoch 4]:   6%|▌         | 42/716 [00:16<04:24,  2.55it/s, loss=13.8][A
[Epoch 4]:   6%|▌         | 42/716 [00:1

[Epoch 4]:  13%|█▎        | 91/716 [00:35<04:01,  2.59it/s, loss=13.2][A
[Epoch 4]:  13%|█▎        | 91/716 [00:35<04:04,  2.56it/s, loss=12.9][A
[Epoch 4]:  13%|█▎        | 92/716 [00:35<04:01,  2.59it/s, loss=12.9][A
[Epoch 4]:  13%|█▎        | 92/716 [00:35<04:03,  2.56it/s, loss=14.5][A
[Epoch 4]:  13%|█▎        | 93/716 [00:35<04:00,  2.59it/s, loss=14.5][A
[Epoch 4]:  13%|█▎        | 93/716 [00:36<04:03,  2.56it/s, loss=13.5][A
[Epoch 4]:  13%|█▎        | 94/716 [00:36<04:00,  2.59it/s, loss=13.5][A
[Epoch 4]:  13%|█▎        | 94/716 [00:36<04:02,  2.56it/s, loss=12.4][A
[Epoch 4]:  13%|█▎        | 95/716 [00:36<04:00,  2.59it/s, loss=12.4][A
[Epoch 4]:  13%|█▎        | 95/716 [00:37<04:02,  2.56it/s, loss=12.9][A
[Epoch 4]:  13%|█▎        | 96/716 [00:37<03:59,  2.59it/s, loss=12.9][A
[Epoch 4]:  13%|█▎        | 96/716 [00:37<04:02,  2.56it/s, loss=14.8][A
[Epoch 4]:  14%|█▎        | 97/716 [00:37<03:59,  2.59it/s, loss=14.8][A
[Epoch 4]:  14%|█▎        | 97/716 [00

[Epoch 4]:  20%|██        | 145/716 [00:56<03:41,  2.58it/s, loss=13.2][A
[Epoch 4]:  20%|██        | 146/716 [00:56<03:39,  2.59it/s, loss=13.2][A
[Epoch 4]:  20%|██        | 146/716 [00:56<03:41,  2.58it/s, loss=13.3][A
[Epoch 4]:  21%|██        | 147/716 [00:56<03:39,  2.59it/s, loss=13.3][A
[Epoch 4]:  21%|██        | 147/716 [00:57<03:40,  2.58it/s, loss=12.4][A
[Epoch 4]:  21%|██        | 148/716 [00:57<03:38,  2.59it/s, loss=12.4][A
[Epoch 4]:  21%|██        | 148/716 [00:57<03:40,  2.58it/s, loss=12.5][A
[Epoch 4]:  21%|██        | 149/716 [00:57<03:38,  2.59it/s, loss=12.5][A
[Epoch 4]:  21%|██        | 149/716 [00:57<03:40,  2.58it/s, loss=12.7][A
[Epoch 4]:  21%|██        | 150/716 [00:57<03:38,  2.59it/s, loss=12.7][A
[Epoch 4]:  21%|██        | 150/716 [00:58<03:39,  2.58it/s, loss=13.5][A
[Epoch 4]:  21%|██        | 151/716 [00:58<03:37,  2.59it/s, loss=13.5][A
[Epoch 4]:  21%|██        | 151/716 [00:58<03:39,  2.58it/s, loss=13.9][A
[Epoch 4]:  21%|██       

[Epoch 4]:  28%|██▊       | 200/716 [01:17<03:18,  2.60it/s, loss=12.6][A
[Epoch 4]:  28%|██▊       | 200/716 [01:17<03:19,  2.58it/s, loss=13.8][A
[Epoch 4]:  28%|██▊       | 201/716 [01:17<03:18,  2.60it/s, loss=13.8][A
[Epoch 4]:  28%|██▊       | 201/716 [01:17<03:19,  2.58it/s, loss=12.6][A
[Epoch 4]:  28%|██▊       | 202/716 [01:17<03:18,  2.60it/s, loss=12.6][A
[Epoch 4]:  28%|██▊       | 202/716 [01:18<03:18,  2.58it/s, loss=14.3][A
[Epoch 4]:  28%|██▊       | 203/716 [01:18<03:17,  2.60it/s, loss=14.3][A
[Epoch 4]:  28%|██▊       | 203/716 [01:18<03:18,  2.58it/s, loss=12.5][A
[Epoch 4]:  28%|██▊       | 204/716 [01:18<03:17,  2.60it/s, loss=12.5][A
[Epoch 4]:  28%|██▊       | 204/716 [01:18<03:18,  2.58it/s, loss=13.6][A
[Epoch 4]:  29%|██▊       | 205/716 [01:18<03:16,  2.60it/s, loss=13.6][A
[Epoch 4]:  29%|██▊       | 205/716 [01:19<03:17,  2.58it/s, loss=14.1][A
[Epoch 4]:  29%|██▉       | 206/716 [01:19<03:16,  2.60it/s, loss=14.1][A
[Epoch 4]:  29%|██▉      

[Epoch 4]:  35%|███▌      | 254/716 [01:38<02:58,  2.59it/s, loss=13.5][A
[Epoch 4]:  36%|███▌      | 255/716 [01:38<02:57,  2.60it/s, loss=13.5][A
[Epoch 4]:  36%|███▌      | 255/716 [01:38<02:57,  2.59it/s, loss=12.8][A
[Epoch 4]:  36%|███▌      | 256/716 [01:38<02:56,  2.60it/s, loss=12.8][A
[Epoch 4]:  36%|███▌      | 256/716 [01:38<02:57,  2.59it/s, loss=14.3][A
[Epoch 4]:  36%|███▌      | 257/716 [01:38<02:56,  2.60it/s, loss=14.3][A
[Epoch 4]:  36%|███▌      | 257/716 [01:39<02:57,  2.59it/s, loss=13.8][A
[Epoch 4]:  36%|███▌      | 258/716 [01:39<02:56,  2.60it/s, loss=13.8][A
[Epoch 4]:  36%|███▌      | 258/716 [01:39<02:56,  2.59it/s, loss=14.4][A
[Epoch 4]:  36%|███▌      | 259/716 [01:39<02:55,  2.60it/s, loss=14.4][A
[Epoch 4]:  36%|███▌      | 259/716 [01:39<02:56,  2.59it/s, loss=13.1][A
[Epoch 4]:  36%|███▋      | 260/716 [01:39<02:55,  2.60it/s, loss=13.1][A
[Epoch 4]:  36%|███▋      | 260/716 [01:40<02:55,  2.59it/s, loss=13.8][A
[Epoch 4]:  36%|███▋     

[Epoch 4]:  43%|████▎     | 309/716 [01:58<02:36,  2.60it/s, loss=13.6][A
[Epoch 4]:  43%|████▎     | 309/716 [01:59<02:36,  2.60it/s, loss=12.9][A
[Epoch 4]:  43%|████▎     | 310/716 [01:59<02:35,  2.60it/s, loss=12.9][A
[Epoch 4]:  43%|████▎     | 310/716 [01:59<02:36,  2.60it/s, loss=12.9][A
[Epoch 4]:  43%|████▎     | 311/716 [01:59<02:35,  2.60it/s, loss=12.9][A
[Epoch 4]:  43%|████▎     | 311/716 [01:59<02:36,  2.60it/s, loss=12.5][A
[Epoch 4]:  44%|████▎     | 312/716 [01:59<02:35,  2.60it/s, loss=12.5][A
[Epoch 4]:  44%|████▎     | 312/716 [02:00<02:35,  2.60it/s, loss=14.6][A
[Epoch 4]:  44%|████▎     | 313/716 [02:00<02:34,  2.60it/s, loss=14.6][A
[Epoch 4]:  44%|████▎     | 313/716 [02:00<02:35,  2.60it/s, loss=14.9][A
[Epoch 4]:  44%|████▍     | 314/716 [02:00<02:34,  2.60it/s, loss=14.9][A
[Epoch 4]:  44%|████▍     | 314/716 [02:00<02:34,  2.60it/s, loss=13.2][A
[Epoch 4]:  44%|████▍     | 315/716 [02:00<02:34,  2.60it/s, loss=13.2][A
[Epoch 4]:  44%|████▍    

[Epoch 4]:  51%|█████     | 363/716 [02:19<02:15,  2.60it/s, loss=13.2][A
[Epoch 4]:  51%|█████     | 364/716 [02:19<02:15,  2.61it/s, loss=13.2][A
[Epoch 4]:  51%|█████     | 364/716 [02:20<02:15,  2.60it/s, loss=14.3][A
[Epoch 4]:  51%|█████     | 365/716 [02:20<02:14,  2.61it/s, loss=14.3][A
[Epoch 4]:  51%|█████     | 365/716 [02:20<02:15,  2.60it/s, loss=12.9][A
[Epoch 4]:  51%|█████     | 366/716 [02:20<02:14,  2.61it/s, loss=12.9][A
[Epoch 4]:  51%|█████     | 366/716 [02:20<02:14,  2.60it/s, loss=12.8][A
[Epoch 4]:  51%|█████▏    | 367/716 [02:20<02:13,  2.61it/s, loss=12.8][A
[Epoch 4]:  51%|█████▏    | 367/716 [02:21<02:14,  2.60it/s, loss=13.5][A
[Epoch 4]:  51%|█████▏    | 368/716 [02:21<02:13,  2.61it/s, loss=13.5][A
[Epoch 4]:  51%|█████▏    | 368/716 [02:21<02:13,  2.60it/s, loss=13]  [A
[Epoch 4]:  52%|█████▏    | 369/716 [02:21<02:13,  2.61it/s, loss=13][A
[Epoch 4]:  52%|█████▏    | 369/716 [02:21<02:13,  2.60it/s, loss=13.5][A
[Epoch 4]:  52%|█████▏    |

[Epoch 4]:  58%|█████▊    | 418/716 [02:40<01:54,  2.61it/s, loss=12.8][A
[Epoch 4]:  58%|█████▊    | 418/716 [02:40<01:54,  2.60it/s, loss=12.7][A
[Epoch 4]:  59%|█████▊    | 419/716 [02:40<01:53,  2.61it/s, loss=12.7][A
[Epoch 4]:  59%|█████▊    | 419/716 [02:41<01:54,  2.60it/s, loss=13.4][A
[Epoch 4]:  59%|█████▊    | 420/716 [02:41<01:53,  2.61it/s, loss=13.4][A
[Epoch 4]:  59%|█████▊    | 420/716 [02:41<01:53,  2.60it/s, loss=14.1][A
[Epoch 4]:  59%|█████▉    | 421/716 [02:41<01:53,  2.61it/s, loss=14.1][A
[Epoch 4]:  59%|█████▉    | 421/716 [02:41<01:53,  2.60it/s, loss=14.4][A
[Epoch 4]:  59%|█████▉    | 422/716 [02:41<01:52,  2.61it/s, loss=14.4][A
[Epoch 4]:  59%|█████▉    | 422/716 [02:42<01:53,  2.60it/s, loss=12.7][A
[Epoch 4]:  59%|█████▉    | 423/716 [02:42<01:52,  2.61it/s, loss=12.7][A
[Epoch 4]:  59%|█████▉    | 423/716 [02:42<01:52,  2.60it/s, loss=13.9][A
[Epoch 4]:  59%|█████▉    | 424/716 [02:42<01:51,  2.61it/s, loss=13.9][A
[Epoch 4]:  59%|█████▉   

[Epoch 4]:  66%|██████▌   | 472/716 [03:01<01:33,  2.60it/s, loss=13.7][A
[Epoch 4]:  66%|██████▌   | 473/716 [03:01<01:33,  2.61it/s, loss=13.7][A
[Epoch 4]:  66%|██████▌   | 473/716 [03:01<01:33,  2.60it/s, loss=12.6][A
[Epoch 4]:  66%|██████▌   | 474/716 [03:01<01:32,  2.61it/s, loss=12.6][A
[Epoch 4]:  66%|██████▌   | 474/716 [03:02<01:33,  2.60it/s, loss=13.7][A
[Epoch 4]:  66%|██████▋   | 475/716 [03:02<01:32,  2.61it/s, loss=13.7][A
[Epoch 4]:  66%|██████▋   | 475/716 [03:02<01:32,  2.60it/s, loss=14.3][A
[Epoch 4]:  66%|██████▋   | 476/716 [03:02<01:32,  2.61it/s, loss=14.3][A
[Epoch 4]:  66%|██████▋   | 476/716 [03:02<01:32,  2.60it/s, loss=13.9][A
[Epoch 4]:  67%|██████▋   | 477/716 [03:02<01:31,  2.61it/s, loss=13.9][A
[Epoch 4]:  67%|██████▋   | 477/716 [03:03<01:31,  2.60it/s, loss=13]  [A
[Epoch 4]:  67%|██████▋   | 478/716 [03:03<01:31,  2.61it/s, loss=13][A
[Epoch 4]:  67%|██████▋   | 478/716 [03:03<01:31,  2.60it/s, loss=13.3][A
[Epoch 4]:  67%|██████▋   |

[Epoch 4]:  74%|███████▎  | 527/716 [03:22<01:12,  2.61it/s, loss=13.2][A
[Epoch 4]:  74%|███████▎  | 527/716 [03:22<01:12,  2.60it/s, loss=14.1][A
[Epoch 4]:  74%|███████▎  | 528/716 [03:22<01:12,  2.61it/s, loss=14.1][A
[Epoch 4]:  74%|███████▎  | 528/716 [03:22<01:12,  2.60it/s, loss=14.3][A
[Epoch 4]:  74%|███████▍  | 529/716 [03:22<01:11,  2.61it/s, loss=14.3][A
[Epoch 4]:  74%|███████▍  | 529/716 [03:23<01:11,  2.60it/s, loss=13.5][A
[Epoch 4]:  74%|███████▍  | 530/716 [03:23<01:11,  2.61it/s, loss=13.5][A
[Epoch 4]:  74%|███████▍  | 530/716 [03:23<01:11,  2.60it/s, loss=13.3][A
[Epoch 4]:  74%|███████▍  | 531/716 [03:23<01:10,  2.61it/s, loss=13.3][A
[Epoch 4]:  74%|███████▍  | 531/716 [03:23<01:11,  2.60it/s, loss=14.7][A
[Epoch 4]:  74%|███████▍  | 532/716 [03:23<01:10,  2.61it/s, loss=14.7][A
[Epoch 4]:  74%|███████▍  | 532/716 [03:24<01:10,  2.60it/s, loss=14.4][A
[Epoch 4]:  74%|███████▍  | 533/716 [03:24<01:10,  2.61it/s, loss=14.4][A
[Epoch 4]:  74%|███████▍ 

[Epoch 4]:  81%|████████  | 581/716 [03:43<00:51,  2.61it/s, loss=12.6][A
[Epoch 4]:  81%|████████▏ | 582/716 [03:43<00:51,  2.61it/s, loss=12.6][A
[Epoch 4]:  81%|████████▏ | 582/716 [03:43<00:51,  2.61it/s, loss=13.4][A
[Epoch 4]:  81%|████████▏ | 583/716 [03:43<00:50,  2.61it/s, loss=13.4][A
[Epoch 4]:  81%|████████▏ | 583/716 [03:43<00:51,  2.61it/s, loss=13.9][A
[Epoch 4]:  82%|████████▏ | 584/716 [03:43<00:50,  2.61it/s, loss=13.9][A
[Epoch 4]:  82%|████████▏ | 584/716 [03:44<00:50,  2.61it/s, loss=13.5][A
[Epoch 4]:  82%|████████▏ | 585/716 [03:44<00:50,  2.61it/s, loss=13.5][A
[Epoch 4]:  82%|████████▏ | 585/716 [03:44<00:50,  2.61it/s, loss=12]  [A
[Epoch 4]:  82%|████████▏ | 586/716 [03:44<00:49,  2.61it/s, loss=12][A
[Epoch 4]:  82%|████████▏ | 586/716 [03:44<00:49,  2.61it/s, loss=14.3][A
[Epoch 4]:  82%|████████▏ | 587/716 [03:44<00:49,  2.61it/s, loss=14.3][A
[Epoch 4]:  82%|████████▏ | 587/716 [03:45<00:49,  2.61it/s, loss=15.3][A
[Epoch 4]:  82%|████████▏ |

[Epoch 4]:  89%|████████▉ | 636/716 [04:03<00:30,  2.61it/s, loss=14.3][A
[Epoch 4]:  89%|████████▉ | 636/716 [04:04<00:30,  2.60it/s, loss=14.4][A
[Epoch 4]:  89%|████████▉ | 637/716 [04:04<00:30,  2.61it/s, loss=14.4][A
[Epoch 4]:  89%|████████▉ | 637/716 [04:04<00:30,  2.60it/s, loss=13.7][A
[Epoch 4]:  89%|████████▉ | 638/716 [04:04<00:29,  2.61it/s, loss=13.7][A
[Epoch 4]:  89%|████████▉ | 638/716 [04:04<00:29,  2.60it/s, loss=13.4][A
[Epoch 4]:  89%|████████▉ | 639/716 [04:04<00:29,  2.61it/s, loss=13.4][A
[Epoch 4]:  89%|████████▉ | 639/716 [04:05<00:29,  2.60it/s, loss=14.6][A
[Epoch 4]:  89%|████████▉ | 640/716 [04:05<00:29,  2.61it/s, loss=14.6][A
[Epoch 4]:  89%|████████▉ | 640/716 [04:05<00:29,  2.60it/s, loss=14.1][A
[Epoch 4]:  90%|████████▉ | 641/716 [04:05<00:28,  2.61it/s, loss=14.1][A
[Epoch 4]:  90%|████████▉ | 641/716 [04:06<00:28,  2.60it/s, loss=14.6][A
[Epoch 4]:  90%|████████▉ | 642/716 [04:06<00:28,  2.61it/s, loss=14.6][A
[Epoch 4]:  90%|████████▉

[Epoch 4]:  96%|█████████▋| 690/716 [04:24<00:09,  2.61it/s, loss=13.8][A
[Epoch 4]:  97%|█████████▋| 691/716 [04:24<00:09,  2.61it/s, loss=13.8][A
[Epoch 4]:  97%|█████████▋| 691/716 [04:25<00:09,  2.61it/s, loss=14.6][A
[Epoch 4]:  97%|█████████▋| 692/716 [04:25<00:09,  2.61it/s, loss=14.6][A
[Epoch 4]:  97%|█████████▋| 692/716 [04:25<00:09,  2.61it/s, loss=15.6][A
[Epoch 4]:  97%|█████████▋| 693/716 [04:25<00:08,  2.61it/s, loss=15.6][A
[Epoch 4]:  97%|█████████▋| 693/716 [04:25<00:08,  2.61it/s, loss=14.3][A
[Epoch 4]:  97%|█████████▋| 694/716 [04:25<00:08,  2.61it/s, loss=14.3][A
[Epoch 4]:  97%|█████████▋| 694/716 [04:26<00:08,  2.61it/s, loss=13.3][A
[Epoch 4]:  97%|█████████▋| 695/716 [04:26<00:08,  2.61it/s, loss=13.3][A
[Epoch 4]:  97%|█████████▋| 695/716 [04:26<00:08,  2.61it/s, loss=13.3][A
[Epoch 4]:  97%|█████████▋| 696/716 [04:26<00:07,  2.61it/s, loss=13.3][A
[Epoch 4]:  97%|█████████▋| 696/716 [04:27<00:07,  2.61it/s, loss=13]  [A
[Epoch 4]:  97%|█████████

[Epoch 5]:   4%|▍         | 29/717 [00:11<04:32,  2.52it/s, loss=13.5][A
[Epoch 5]:   4%|▍         | 29/717 [00:11<04:41,  2.44it/s, loss=13.7][A
[Epoch 5]:   4%|▍         | 30/717 [00:11<04:32,  2.53it/s, loss=13.7][A
[Epoch 5]:   4%|▍         | 30/717 [00:12<04:40,  2.45it/s, loss=13.2][A
[Epoch 5]:   4%|▍         | 31/717 [00:12<04:31,  2.53it/s, loss=13.2][A
[Epoch 5]:   4%|▍         | 31/717 [00:12<04:39,  2.45it/s, loss=14.6][A
[Epoch 5]:   4%|▍         | 32/717 [00:12<04:30,  2.53it/s, loss=14.6][A
[Epoch 5]:   4%|▍         | 32/717 [00:13<04:38,  2.46it/s, loss=14.1][A
[Epoch 5]:   5%|▍         | 33/717 [00:13<04:30,  2.53it/s, loss=14.1][A
[Epoch 5]:   5%|▍         | 33/717 [00:13<04:38,  2.46it/s, loss=12.9][A
[Epoch 5]:   5%|▍         | 34/717 [00:13<04:29,  2.53it/s, loss=12.9][A
[Epoch 5]:   5%|▍         | 34/717 [00:13<04:37,  2.46it/s, loss=13.8][A
[Epoch 5]:   5%|▍         | 35/717 [00:13<04:29,  2.53it/s, loss=13.8][A
[Epoch 5]:   5%|▍         | 35/717 [00

[Epoch 5]:  12%|█▏        | 84/717 [00:32<04:06,  2.57it/s, loss=13.1][A
[Epoch 5]:  12%|█▏        | 84/717 [00:33<04:09,  2.54it/s, loss=14.2][A
[Epoch 5]:  12%|█▏        | 85/717 [00:33<04:06,  2.57it/s, loss=14.2][A
[Epoch 5]:  12%|█▏        | 85/717 [00:33<04:09,  2.54it/s, loss=13.3][A
[Epoch 5]:  12%|█▏        | 86/717 [00:33<04:05,  2.57it/s, loss=13.3][A
[Epoch 5]:  12%|█▏        | 86/717 [00:33<04:08,  2.54it/s, loss=14]  [A
[Epoch 5]:  12%|█▏        | 87/717 [00:33<04:05,  2.57it/s, loss=14][A
[Epoch 5]:  12%|█▏        | 87/717 [00:34<04:08,  2.54it/s, loss=13.1][A
[Epoch 5]:  12%|█▏        | 88/717 [00:34<04:04,  2.57it/s, loss=13.1][A
[Epoch 5]:  12%|█▏        | 88/717 [00:34<04:07,  2.54it/s, loss=13.8][A
[Epoch 5]:  12%|█▏        | 89/717 [00:34<04:04,  2.57it/s, loss=13.8][A
[Epoch 5]:  12%|█▏        | 89/717 [00:35<04:07,  2.54it/s, loss=12.6][A
[Epoch 5]:  13%|█▎        | 90/717 [00:35<04:03,  2.57it/s, loss=12.6][A
[Epoch 5]:  13%|█▎        | 90/717 [00:3

[Epoch 5]:  19%|█▉        | 138/717 [00:53<03:45,  2.57it/s, loss=13.3][A
[Epoch 5]:  19%|█▉        | 139/717 [00:53<03:43,  2.58it/s, loss=13.3][A
[Epoch 5]:  19%|█▉        | 139/717 [00:54<03:45,  2.57it/s, loss=13.4][A
[Epoch 5]:  20%|█▉        | 140/717 [00:54<03:43,  2.58it/s, loss=13.4][A
[Epoch 5]:  20%|█▉        | 140/717 [00:54<03:44,  2.57it/s, loss=13.7][A
[Epoch 5]:  20%|█▉        | 141/717 [00:54<03:42,  2.59it/s, loss=13.7][A
[Epoch 5]:  20%|█▉        | 141/717 [00:54<03:44,  2.57it/s, loss=13.9][A
[Epoch 5]:  20%|█▉        | 142/717 [00:54<03:42,  2.59it/s, loss=13.9][A
[Epoch 5]:  20%|█▉        | 142/717 [00:55<03:43,  2.57it/s, loss=13.3][A
[Epoch 5]:  20%|█▉        | 143/717 [00:55<03:42,  2.59it/s, loss=13.3][A
[Epoch 5]:  20%|█▉        | 143/717 [00:55<03:43,  2.57it/s, loss=14.2][A
[Epoch 5]:  20%|██        | 144/717 [00:55<03:41,  2.59it/s, loss=14.2][A
[Epoch 5]:  20%|██        | 144/717 [00:56<03:43,  2.57it/s, loss=12.9][A
[Epoch 5]:  20%|██       

[Epoch 5]:  27%|██▋       | 193/717 [01:14<03:22,  2.59it/s, loss=15.4][A
[Epoch 5]:  27%|██▋       | 193/717 [01:14<03:23,  2.58it/s, loss=12.6][A
[Epoch 5]:  27%|██▋       | 194/717 [01:14<03:22,  2.59it/s, loss=12.6][A
[Epoch 5]:  27%|██▋       | 194/717 [01:15<03:23,  2.58it/s, loss=12.9][A
[Epoch 5]:  27%|██▋       | 195/717 [01:15<03:21,  2.59it/s, loss=12.9][A
[Epoch 5]:  27%|██▋       | 195/717 [01:15<03:22,  2.58it/s, loss=12.8][A
[Epoch 5]:  27%|██▋       | 196/717 [01:15<03:21,  2.59it/s, loss=12.8][A
[Epoch 5]:  27%|██▋       | 196/717 [01:16<03:22,  2.58it/s, loss=13.6][A
[Epoch 5]:  27%|██▋       | 197/717 [01:16<03:20,  2.59it/s, loss=13.6][A
[Epoch 5]:  27%|██▋       | 197/717 [01:16<03:21,  2.58it/s, loss=13]  [A
[Epoch 5]:  28%|██▊       | 198/717 [01:16<03:20,  2.59it/s, loss=13][A
[Epoch 5]:  28%|██▊       | 198/717 [01:16<03:21,  2.58it/s, loss=13.1][A
[Epoch 5]:  28%|██▊       | 199/717 [01:16<03:20,  2.59it/s, loss=13.1][A
[Epoch 5]:  28%|██▊       |

[Epoch 5]:  34%|███▍      | 247/717 [01:35<03:01,  2.58it/s, loss=13.8][A
[Epoch 5]:  35%|███▍      | 248/717 [01:35<03:00,  2.59it/s, loss=13.8][A
[Epoch 5]:  35%|███▍      | 248/717 [01:35<03:01,  2.58it/s, loss=13.2][A
[Epoch 5]:  35%|███▍      | 249/717 [01:35<03:00,  2.59it/s, loss=13.2][A
[Epoch 5]:  35%|███▍      | 249/717 [01:36<03:01,  2.58it/s, loss=13.4][A
[Epoch 5]:  35%|███▍      | 250/717 [01:36<02:59,  2.59it/s, loss=13.4][A
[Epoch 5]:  35%|███▍      | 250/717 [01:36<03:00,  2.58it/s, loss=12.6][A
[Epoch 5]:  35%|███▌      | 251/717 [01:36<02:59,  2.59it/s, loss=12.6][A
[Epoch 5]:  35%|███▌      | 251/717 [01:37<03:00,  2.58it/s, loss=13.9][A
[Epoch 5]:  35%|███▌      | 252/717 [01:37<02:59,  2.60it/s, loss=13.9][A
[Epoch 5]:  35%|███▌      | 252/717 [01:37<02:59,  2.58it/s, loss=14.1][A
[Epoch 5]:  35%|███▌      | 253/717 [01:37<02:58,  2.60it/s, loss=14.1][A
[Epoch 5]:  35%|███▌      | 253/717 [01:37<02:59,  2.59it/s, loss=13.4][A
[Epoch 5]:  35%|███▌     

[Epoch 5]:  42%|████▏     | 302/717 [01:56<02:39,  2.60it/s, loss=13.3][A
[Epoch 5]:  42%|████▏     | 302/717 [01:56<02:40,  2.59it/s, loss=12.9][A
[Epoch 5]:  42%|████▏     | 303/717 [01:56<02:39,  2.60it/s, loss=12.9][A
[Epoch 5]:  42%|████▏     | 303/717 [01:57<02:39,  2.59it/s, loss=12.8][A
[Epoch 5]:  42%|████▏     | 304/717 [01:57<02:39,  2.60it/s, loss=12.8][A
[Epoch 5]:  42%|████▏     | 304/717 [01:57<02:39,  2.59it/s, loss=14.1][A
[Epoch 5]:  43%|████▎     | 305/717 [01:57<02:38,  2.60it/s, loss=14.1][A
[Epoch 5]:  43%|████▎     | 305/717 [01:57<02:39,  2.59it/s, loss=12.8][A
[Epoch 5]:  43%|████▎     | 306/717 [01:57<02:38,  2.60it/s, loss=12.8][A
[Epoch 5]:  43%|████▎     | 306/717 [01:58<02:38,  2.59it/s, loss=12.8][A
[Epoch 5]:  43%|████▎     | 307/717 [01:58<02:37,  2.60it/s, loss=12.8][A
[Epoch 5]:  43%|████▎     | 307/717 [01:58<02:38,  2.59it/s, loss=13.8][A
[Epoch 5]:  43%|████▎     | 308/717 [01:58<02:37,  2.60it/s, loss=13.8][A
[Epoch 5]:  43%|████▎    

[Epoch 5]:  50%|████▉     | 356/717 [02:17<02:19,  2.59it/s, loss=13.1][A
[Epoch 5]:  50%|████▉     | 357/717 [02:17<02:18,  2.60it/s, loss=13.1][A
[Epoch 5]:  50%|████▉     | 357/717 [02:17<02:18,  2.59it/s, loss=12.6][A
[Epoch 5]:  50%|████▉     | 358/717 [02:17<02:18,  2.60it/s, loss=12.6][A
[Epoch 5]:  50%|████▉     | 358/717 [02:18<02:18,  2.59it/s, loss=13.8][A
[Epoch 5]:  50%|█████     | 359/717 [02:18<02:17,  2.60it/s, loss=13.8][A
[Epoch 5]:  50%|█████     | 359/717 [02:18<02:18,  2.59it/s, loss=13.1][A
[Epoch 5]:  50%|█████     | 360/717 [02:18<02:17,  2.60it/s, loss=13.1][A
[Epoch 5]:  50%|█████     | 360/717 [02:18<02:17,  2.59it/s, loss=14.4][A
[Epoch 5]:  50%|█████     | 361/717 [02:18<02:16,  2.60it/s, loss=14.4][A
[Epoch 5]:  50%|█████     | 361/717 [02:19<02:17,  2.59it/s, loss=12.8][A
[Epoch 5]:  50%|█████     | 362/717 [02:19<02:16,  2.60it/s, loss=12.8][A
[Epoch 5]:  50%|█████     | 362/717 [02:19<02:16,  2.59it/s, loss=13.7][A
[Epoch 5]:  51%|█████    

[Epoch 5]:  57%|█████▋    | 411/717 [02:37<01:57,  2.60it/s, loss=13.9][A
[Epoch 5]:  57%|█████▋    | 411/717 [02:38<01:57,  2.60it/s, loss=12.8][A
[Epoch 5]:  57%|█████▋    | 412/717 [02:38<01:57,  2.60it/s, loss=12.8][A
[Epoch 5]:  57%|█████▋    | 412/717 [02:38<01:57,  2.60it/s, loss=13.8][A
[Epoch 5]:  58%|█████▊    | 413/717 [02:38<01:56,  2.60it/s, loss=13.8][A
[Epoch 5]:  58%|█████▊    | 413/717 [02:39<01:57,  2.60it/s, loss=12.6][A
[Epoch 5]:  58%|█████▊    | 414/717 [02:39<01:56,  2.60it/s, loss=12.6][A
[Epoch 5]:  58%|█████▊    | 414/717 [02:39<01:56,  2.60it/s, loss=13.5][A
[Epoch 5]:  58%|█████▊    | 415/717 [02:39<01:56,  2.60it/s, loss=13.5][A
[Epoch 5]:  58%|█████▊    | 415/717 [02:39<01:56,  2.60it/s, loss=12.7][A
[Epoch 5]:  58%|█████▊    | 416/717 [02:39<01:55,  2.60it/s, loss=12.7][A
[Epoch 5]:  58%|█████▊    | 416/717 [02:40<01:55,  2.60it/s, loss=14]  [A
[Epoch 5]:  58%|█████▊    | 417/717 [02:40<01:55,  2.60it/s, loss=14][A
[Epoch 5]:  58%|█████▊    |

[Epoch 5]:  65%|██████▍   | 465/717 [02:58<01:36,  2.60it/s, loss=13.3][A
[Epoch 5]:  65%|██████▍   | 466/717 [02:58<01:36,  2.61it/s, loss=13.3][A
[Epoch 5]:  65%|██████▍   | 466/717 [02:59<01:36,  2.60it/s, loss=13]  [A
[Epoch 5]:  65%|██████▌   | 467/717 [02:59<01:35,  2.61it/s, loss=13][A
[Epoch 5]:  65%|██████▌   | 467/717 [02:59<01:36,  2.60it/s, loss=13.1][A
[Epoch 5]:  65%|██████▌   | 468/717 [02:59<01:35,  2.61it/s, loss=13.1][A
[Epoch 5]:  65%|██████▌   | 468/717 [02:59<01:35,  2.60it/s, loss=14]  [A
[Epoch 5]:  65%|██████▌   | 469/717 [02:59<01:35,  2.61it/s, loss=14][A
[Epoch 5]:  65%|██████▌   | 469/717 [03:00<01:35,  2.60it/s, loss=13][A
[Epoch 5]:  66%|██████▌   | 470/717 [03:00<01:34,  2.61it/s, loss=13][A
[Epoch 5]:  66%|██████▌   | 470/717 [03:00<01:34,  2.60it/s, loss=14.1][A
[Epoch 5]:  66%|██████▌   | 471/717 [03:00<01:34,  2.61it/s, loss=14.1][A
[Epoch 5]:  66%|██████▌   | 471/717 [03:01<01:34,  2.60it/s, loss=14.3][A
[Epoch 5]:  66%|██████▌   | 472/7

[Epoch 5]:  73%|███████▎  | 520/717 [03:19<01:15,  2.61it/s, loss=13.7][A
[Epoch 5]:  73%|███████▎  | 520/717 [03:19<01:15,  2.60it/s, loss=12.8][A
[Epoch 5]:  73%|███████▎  | 521/717 [03:19<01:15,  2.61it/s, loss=12.8][A
[Epoch 5]:  73%|███████▎  | 521/717 [03:20<01:15,  2.60it/s, loss=13.5][A
[Epoch 5]:  73%|███████▎  | 522/717 [03:20<01:14,  2.61it/s, loss=13.5][A
[Epoch 5]:  73%|███████▎  | 522/717 [03:20<01:14,  2.60it/s, loss=12.2][A
[Epoch 5]:  73%|███████▎  | 523/717 [03:20<01:14,  2.61it/s, loss=12.2][A
[Epoch 5]:  73%|███████▎  | 523/717 [03:20<01:14,  2.60it/s, loss=12.9][A
[Epoch 5]:  73%|███████▎  | 524/717 [03:20<01:14,  2.61it/s, loss=12.9][A
[Epoch 5]:  73%|███████▎  | 524/717 [03:21<01:14,  2.60it/s, loss=13]  [A
[Epoch 5]:  73%|███████▎  | 525/717 [03:21<01:13,  2.61it/s, loss=13][A
[Epoch 5]:  73%|███████▎  | 525/717 [03:21<01:13,  2.60it/s, loss=13.7][A
[Epoch 5]:  73%|███████▎  | 526/717 [03:21<01:13,  2.61it/s, loss=13.7][A
[Epoch 5]:  73%|███████▎  |

[Epoch 5]:  80%|████████  | 574/717 [03:40<00:54,  2.61it/s, loss=13.5][A
[Epoch 5]:  80%|████████  | 575/717 [03:40<00:54,  2.61it/s, loss=13.5][A
[Epoch 5]:  80%|████████  | 575/717 [03:40<00:54,  2.61it/s, loss=13.6][A
[Epoch 5]:  80%|████████  | 576/717 [03:40<00:54,  2.61it/s, loss=13.6][A
[Epoch 5]:  80%|████████  | 576/717 [03:41<00:54,  2.61it/s, loss=15.2][A
[Epoch 5]:  80%|████████  | 577/717 [03:41<00:53,  2.61it/s, loss=15.2][A
[Epoch 5]:  80%|████████  | 577/717 [03:41<00:53,  2.61it/s, loss=14.3][A
[Epoch 5]:  81%|████████  | 578/717 [03:41<00:53,  2.61it/s, loss=14.3][A
[Epoch 5]:  81%|████████  | 578/717 [03:41<00:53,  2.61it/s, loss=13.2][A
[Epoch 5]:  81%|████████  | 579/717 [03:41<00:52,  2.61it/s, loss=13.2][A
[Epoch 5]:  81%|████████  | 579/717 [03:42<00:52,  2.61it/s, loss=14.5][A
[Epoch 5]:  81%|████████  | 580/717 [03:42<00:52,  2.61it/s, loss=14.5][A
[Epoch 5]:  81%|████████  | 580/717 [03:42<00:52,  2.61it/s, loss=12.9][A
[Epoch 5]:  81%|████████ 

[Epoch 5]:  88%|████████▊ | 629/717 [04:00<00:33,  2.61it/s, loss=14.2][A
[Epoch 5]:  88%|████████▊ | 629/717 [04:01<00:33,  2.61it/s, loss=13]  [A
[Epoch 5]:  88%|████████▊ | 630/717 [04:01<00:33,  2.61it/s, loss=13][A
[Epoch 5]:  88%|████████▊ | 630/717 [04:01<00:33,  2.61it/s, loss=13.2][A
[Epoch 5]:  88%|████████▊ | 631/717 [04:01<00:32,  2.61it/s, loss=13.2][A
[Epoch 5]:  88%|████████▊ | 631/717 [04:01<00:32,  2.61it/s, loss=13.1][A
[Epoch 5]:  88%|████████▊ | 632/717 [04:01<00:32,  2.61it/s, loss=13.1][A
[Epoch 5]:  88%|████████▊ | 632/717 [04:02<00:32,  2.61it/s, loss=13.9][A
[Epoch 5]:  88%|████████▊ | 633/717 [04:02<00:32,  2.61it/s, loss=13.9][A
[Epoch 5]:  88%|████████▊ | 633/717 [04:02<00:32,  2.61it/s, loss=14.5][A
[Epoch 5]:  88%|████████▊ | 634/717 [04:02<00:31,  2.61it/s, loss=14.5][A
[Epoch 5]:  88%|████████▊ | 634/717 [04:03<00:31,  2.61it/s, loss=14.1][A
[Epoch 5]:  89%|████████▊ | 635/717 [04:03<00:31,  2.61it/s, loss=14.1][A
[Epoch 5]:  89%|████████▊ |

[Epoch 5]:  95%|█████████▌| 683/717 [04:21<00:13,  2.61it/s, loss=13.9][A
[Epoch 5]:  95%|█████████▌| 684/717 [04:21<00:12,  2.61it/s, loss=13.9][A
[Epoch 5]:  95%|█████████▌| 684/717 [04:22<00:12,  2.61it/s, loss=13.6][A
[Epoch 5]:  96%|█████████▌| 685/717 [04:22<00:12,  2.61it/s, loss=13.6][A
[Epoch 5]:  96%|█████████▌| 685/717 [04:22<00:12,  2.61it/s, loss=13.2][A
[Epoch 5]:  96%|█████████▌| 686/717 [04:22<00:11,  2.61it/s, loss=13.2][A
[Epoch 5]:  96%|█████████▌| 686/717 [04:22<00:11,  2.61it/s, loss=15.2][A
[Epoch 5]:  96%|█████████▌| 687/717 [04:22<00:11,  2.61it/s, loss=15.2][A
[Epoch 5]:  96%|█████████▌| 687/717 [04:23<00:11,  2.61it/s, loss=13.5][A
[Epoch 5]:  96%|█████████▌| 688/717 [04:23<00:11,  2.61it/s, loss=13.5][A
[Epoch 5]:  96%|█████████▌| 688/717 [04:23<00:11,  2.61it/s, loss=13.9][A
[Epoch 5]:  96%|█████████▌| 689/717 [04:23<00:10,  2.61it/s, loss=13.9][A
[Epoch 5]:  96%|█████████▌| 689/717 [04:24<00:10,  2.61it/s, loss=14.7][A
[Epoch 5]:  96%|█████████

[Epoch 6]:   3%|▎         | 21/715 [00:08<04:40,  2.48it/s, loss=13.6][A
[Epoch 6]:   3%|▎         | 21/715 [00:08<04:53,  2.37it/s, loss=12.6][A
[Epoch 6]:   3%|▎         | 22/715 [00:08<04:39,  2.48it/s, loss=12.6][A
[Epoch 6]:   3%|▎         | 22/715 [00:09<04:51,  2.38it/s, loss=15.3][A
[Epoch 6]:   3%|▎         | 23/715 [00:09<04:38,  2.48it/s, loss=15.3][A
[Epoch 6]:   3%|▎         | 23/715 [00:09<04:50,  2.39it/s, loss=13]  [A
[Epoch 6]:   3%|▎         | 24/715 [00:09<04:37,  2.49it/s, loss=13][A
[Epoch 6]:   3%|▎         | 24/715 [00:10<04:48,  2.39it/s, loss=13][A
[Epoch 6]:   3%|▎         | 25/715 [00:10<04:36,  2.49it/s, loss=13][A
[Epoch 6]:   3%|▎         | 25/715 [00:10<04:47,  2.40it/s, loss=12.9][A
[Epoch 6]:   4%|▎         | 26/715 [00:10<04:36,  2.50it/s, loss=12.9][A
[Epoch 6]:   4%|▎         | 26/715 [00:10<04:46,  2.41it/s, loss=13.6][A
[Epoch 6]:   4%|▍         | 27/715 [00:10<04:35,  2.50it/s, loss=13.6][A
[Epoch 6]:   4%|▍         | 27/715 [00:11<04

[Epoch 6]:  11%|█         | 76/715 [00:29<04:09,  2.57it/s, loss=14.5][A
[Epoch 6]:  11%|█         | 76/715 [00:29<04:12,  2.53it/s, loss=12.4][A
[Epoch 6]:  11%|█         | 77/715 [00:29<04:08,  2.57it/s, loss=12.4][A
[Epoch 6]:  11%|█         | 77/715 [00:30<04:11,  2.54it/s, loss=12.7][A
[Epoch 6]:  11%|█         | 78/715 [00:30<04:08,  2.57it/s, loss=12.7][A
[Epoch 6]:  11%|█         | 78/715 [00:30<04:11,  2.54it/s, loss=13.9][A
[Epoch 6]:  11%|█         | 79/715 [00:30<04:07,  2.57it/s, loss=13.9][A
[Epoch 6]:  11%|█         | 79/715 [00:31<04:10,  2.54it/s, loss=14.1][A
[Epoch 6]:  11%|█         | 80/715 [00:31<04:07,  2.57it/s, loss=14.1][A
[Epoch 6]:  11%|█         | 80/715 [00:31<04:10,  2.54it/s, loss=13.3][A
[Epoch 6]:  11%|█▏        | 81/715 [00:31<04:06,  2.57it/s, loss=13.3][A
[Epoch 6]:  11%|█▏        | 81/715 [00:31<04:09,  2.54it/s, loss=13.6][A
[Epoch 6]:  11%|█▏        | 82/715 [00:31<04:06,  2.57it/s, loss=13.6][A
[Epoch 6]:  11%|█▏        | 82/715 [00

[Epoch 6]:  18%|█▊        | 131/715 [00:50<03:45,  2.59it/s, loss=14.2][A
[Epoch 6]:  18%|█▊        | 131/715 [00:51<03:47,  2.57it/s, loss=14.1][A
[Epoch 6]:  18%|█▊        | 132/715 [00:51<03:45,  2.58it/s, loss=14.1][A
[Epoch 6]:  18%|█▊        | 132/715 [00:51<03:47,  2.57it/s, loss=15.3][A
[Epoch 6]:  19%|█▊        | 133/715 [00:51<03:45,  2.59it/s, loss=15.3][A
[Epoch 6]:  19%|█▊        | 133/715 [00:51<03:46,  2.57it/s, loss=12.8][A
[Epoch 6]:  19%|█▊        | 134/715 [00:51<03:44,  2.59it/s, loss=12.8][A
[Epoch 6]:  19%|█▊        | 134/715 [00:52<03:46,  2.57it/s, loss=14]  [A
[Epoch 6]:  19%|█▉        | 135/715 [00:52<03:44,  2.59it/s, loss=14][A
[Epoch 6]:  19%|█▉        | 135/715 [00:52<03:45,  2.57it/s, loss=13.9][A
[Epoch 6]:  19%|█▉        | 136/715 [00:52<03:43,  2.59it/s, loss=13.9][A
[Epoch 6]:  19%|█▉        | 136/715 [00:52<03:45,  2.57it/s, loss=12.3][A
[Epoch 6]:  19%|█▉        | 137/715 [00:52<03:43,  2.59it/s, loss=12.3][A
[Epoch 6]:  19%|█▉        |

[Epoch 6]:  26%|██▌       | 185/715 [01:11<03:25,  2.58it/s, loss=13.2][A
[Epoch 6]:  26%|██▌       | 186/715 [01:11<03:23,  2.59it/s, loss=13.2][A
[Epoch 6]:  26%|██▌       | 186/715 [01:12<03:24,  2.58it/s, loss=15]  [A
[Epoch 6]:  26%|██▌       | 187/715 [01:12<03:23,  2.60it/s, loss=15][A
[Epoch 6]:  26%|██▌       | 187/715 [01:12<03:24,  2.58it/s, loss=14.7][A
[Epoch 6]:  26%|██▋       | 188/715 [01:12<03:23,  2.59it/s, loss=14.7][A
[Epoch 6]:  26%|██▋       | 188/715 [01:12<03:24,  2.58it/s, loss=14.4][A
[Epoch 6]:  26%|██▋       | 189/715 [01:12<03:22,  2.60it/s, loss=14.4][A
[Epoch 6]:  26%|██▋       | 189/715 [01:13<03:23,  2.58it/s, loss=14.6][A
[Epoch 6]:  27%|██▋       | 190/715 [01:13<03:22,  2.60it/s, loss=14.6][A
[Epoch 6]:  27%|██▋       | 190/715 [01:13<03:23,  2.58it/s, loss=13.7][A
[Epoch 6]:  27%|██▋       | 191/715 [01:13<03:21,  2.60it/s, loss=13.7][A
[Epoch 6]:  27%|██▋       | 191/715 [01:13<03:22,  2.58it/s, loss=13.4][A
[Epoch 6]:  27%|██▋       |

[Epoch 6]:  34%|███▎      | 240/715 [01:32<03:02,  2.60it/s, loss=14.2][A
[Epoch 6]:  34%|███▎      | 240/715 [01:32<03:03,  2.59it/s, loss=13.7][A
[Epoch 6]:  34%|███▎      | 241/715 [01:32<03:02,  2.60it/s, loss=13.7][A
[Epoch 6]:  34%|███▎      | 241/715 [01:33<03:02,  2.59it/s, loss=13.3][A
[Epoch 6]:  34%|███▍      | 242/715 [01:33<03:01,  2.60it/s, loss=13.3][A
[Epoch 6]:  34%|███▍      | 242/715 [01:33<03:02,  2.59it/s, loss=13.4][A
[Epoch 6]:  34%|███▍      | 243/715 [01:33<03:01,  2.60it/s, loss=13.4][A
[Epoch 6]:  34%|███▍      | 243/715 [01:33<03:02,  2.59it/s, loss=14.1][A
[Epoch 6]:  34%|███▍      | 244/715 [01:33<03:01,  2.60it/s, loss=14.1][A
[Epoch 6]:  34%|███▍      | 244/715 [01:34<03:01,  2.59it/s, loss=13.3][A
[Epoch 6]:  34%|███▍      | 245/715 [01:34<03:00,  2.60it/s, loss=13.3][A
[Epoch 6]:  34%|███▍      | 245/715 [01:34<03:01,  2.59it/s, loss=12.6][A
[Epoch 6]:  34%|███▍      | 246/715 [01:34<03:00,  2.60it/s, loss=12.6][A
[Epoch 6]:  34%|███▍     

[Epoch 6]:  41%|████      | 294/715 [01:53<02:42,  2.59it/s, loss=13.9][A
[Epoch 6]:  41%|████▏     | 295/715 [01:53<02:41,  2.60it/s, loss=13.9][A
[Epoch 6]:  41%|████▏     | 295/715 [01:53<02:41,  2.59it/s, loss=14.7][A
[Epoch 6]:  41%|████▏     | 296/715 [01:53<02:40,  2.60it/s, loss=14.7][A
[Epoch 6]:  41%|████▏     | 296/715 [01:54<02:41,  2.59it/s, loss=13.1][A
[Epoch 6]:  42%|████▏     | 297/715 [01:54<02:40,  2.60it/s, loss=13.1][A
[Epoch 6]:  42%|████▏     | 297/715 [01:54<02:41,  2.59it/s, loss=15.7][A
[Epoch 6]:  42%|████▏     | 298/715 [01:54<02:40,  2.60it/s, loss=15.7][A
[Epoch 6]:  42%|████▏     | 298/715 [01:54<02:40,  2.59it/s, loss=13.3][A
[Epoch 6]:  42%|████▏     | 299/715 [01:54<02:39,  2.60it/s, loss=13.3][A
[Epoch 6]:  42%|████▏     | 299/715 [01:55<02:40,  2.59it/s, loss=13.6][A
[Epoch 6]:  42%|████▏     | 300/715 [01:55<02:39,  2.60it/s, loss=13.6][A
[Epoch 6]:  42%|████▏     | 300/715 [01:55<02:39,  2.59it/s, loss=14.8][A
[Epoch 6]:  42%|████▏    

[Epoch 6]:  49%|████▉     | 349/715 [02:13<02:20,  2.61it/s, loss=13.5][A
[Epoch 6]:  49%|████▉     | 349/715 [02:14<02:20,  2.60it/s, loss=14.5][A
[Epoch 6]:  49%|████▉     | 350/715 [02:14<02:20,  2.61it/s, loss=14.5][A
[Epoch 6]:  49%|████▉     | 350/715 [02:14<02:20,  2.60it/s, loss=13.8][A
[Epoch 6]:  49%|████▉     | 351/715 [02:14<02:19,  2.61it/s, loss=13.8][A
[Epoch 6]:  49%|████▉     | 351/715 [02:15<02:20,  2.60it/s, loss=12.3][A
[Epoch 6]:  49%|████▉     | 352/715 [02:15<02:19,  2.61it/s, loss=12.3][A
[Epoch 6]:  49%|████▉     | 352/715 [02:15<02:19,  2.60it/s, loss=14.3][A
[Epoch 6]:  49%|████▉     | 353/715 [02:15<02:18,  2.61it/s, loss=14.3][A
[Epoch 6]:  49%|████▉     | 353/715 [02:15<02:19,  2.60it/s, loss=12.8][A
[Epoch 6]:  50%|████▉     | 354/715 [02:15<02:18,  2.61it/s, loss=12.8][A
[Epoch 6]:  50%|████▉     | 354/715 [02:16<02:18,  2.60it/s, loss=14.6][A
[Epoch 6]:  50%|████▉     | 355/715 [02:16<02:18,  2.61it/s, loss=14.6][A
[Epoch 6]:  50%|████▉    

[Epoch 6]:  56%|█████▋    | 403/715 [02:35<02:00,  2.60it/s, loss=14.7][A
[Epoch 6]:  57%|█████▋    | 404/715 [02:35<01:59,  2.60it/s, loss=14.7][A
[Epoch 6]:  57%|█████▋    | 404/715 [02:35<01:59,  2.60it/s, loss=13.9][A
[Epoch 6]:  57%|█████▋    | 405/715 [02:35<01:59,  2.60it/s, loss=13.9][A
[Epoch 6]:  57%|█████▋    | 405/715 [02:35<01:59,  2.60it/s, loss=12.9][A
[Epoch 6]:  57%|█████▋    | 406/715 [02:35<01:58,  2.60it/s, loss=12.9][A
[Epoch 6]:  57%|█████▋    | 406/715 [02:36<01:58,  2.60it/s, loss=13.5][A
[Epoch 6]:  57%|█████▋    | 407/715 [02:36<01:58,  2.60it/s, loss=13.5][A
[Epoch 6]:  57%|█████▋    | 407/715 [02:36<01:58,  2.60it/s, loss=13.6][A
[Epoch 6]:  57%|█████▋    | 408/715 [02:36<01:57,  2.60it/s, loss=13.6][A
[Epoch 6]:  57%|█████▋    | 408/715 [02:37<01:58,  2.60it/s, loss=14.1][A
[Epoch 6]:  57%|█████▋    | 409/715 [02:37<01:57,  2.60it/s, loss=14.1][A
[Epoch 6]:  57%|█████▋    | 409/715 [02:37<01:57,  2.60it/s, loss=12.4][A
[Epoch 6]:  57%|█████▋   

[Epoch 6]:  64%|██████▍   | 458/715 [02:55<01:38,  2.61it/s, loss=13.3][A
[Epoch 6]:  64%|██████▍   | 458/715 [02:56<01:38,  2.60it/s, loss=13.2][A
[Epoch 6]:  64%|██████▍   | 459/715 [02:56<01:38,  2.61it/s, loss=13.2][A
[Epoch 6]:  64%|██████▍   | 459/715 [02:56<01:38,  2.60it/s, loss=13.4][A
[Epoch 6]:  64%|██████▍   | 460/715 [02:56<01:37,  2.61it/s, loss=13.4][A
[Epoch 6]:  64%|██████▍   | 460/715 [02:56<01:38,  2.60it/s, loss=12.8][A
[Epoch 6]:  64%|██████▍   | 461/715 [02:56<01:37,  2.61it/s, loss=12.8][A
[Epoch 6]:  64%|██████▍   | 461/715 [02:57<01:37,  2.60it/s, loss=14.2][A
[Epoch 6]:  65%|██████▍   | 462/715 [02:57<01:37,  2.61it/s, loss=14.2][A
[Epoch 6]:  65%|██████▍   | 462/715 [02:57<01:37,  2.60it/s, loss=14.5][A
[Epoch 6]:  65%|██████▍   | 463/715 [02:57<01:36,  2.61it/s, loss=14.5][A
[Epoch 6]:  65%|██████▍   | 463/715 [02:58<01:36,  2.60it/s, loss=13.9][A
[Epoch 6]:  65%|██████▍   | 464/715 [02:58<01:36,  2.61it/s, loss=13.9][A
[Epoch 6]:  65%|██████▍  

[Epoch 6]:  72%|███████▏  | 512/715 [03:16<01:18,  2.60it/s, loss=12.6][A
[Epoch 6]:  72%|███████▏  | 513/715 [03:16<01:17,  2.61it/s, loss=12.6][A
[Epoch 6]:  72%|███████▏  | 513/715 [03:17<01:17,  2.60it/s, loss=13.4][A
[Epoch 6]:  72%|███████▏  | 514/715 [03:17<01:17,  2.61it/s, loss=13.4][A
[Epoch 6]:  72%|███████▏  | 514/715 [03:17<01:17,  2.60it/s, loss=14]  [A
[Epoch 6]:  72%|███████▏  | 515/715 [03:17<01:16,  2.61it/s, loss=14][A
[Epoch 6]:  72%|███████▏  | 515/715 [03:17<01:16,  2.60it/s, loss=14.6][A
[Epoch 6]:  72%|███████▏  | 516/715 [03:17<01:16,  2.61it/s, loss=14.6][A
[Epoch 6]:  72%|███████▏  | 516/715 [03:18<01:16,  2.60it/s, loss=13.7][A
[Epoch 6]:  72%|███████▏  | 517/715 [03:18<01:15,  2.61it/s, loss=13.7][A
[Epoch 6]:  72%|███████▏  | 517/715 [03:18<01:16,  2.60it/s, loss=13.3][A
[Epoch 6]:  72%|███████▏  | 518/715 [03:18<01:15,  2.61it/s, loss=13.3][A
[Epoch 6]:  72%|███████▏  | 518/715 [03:19<01:15,  2.60it/s, loss=13.6][A
[Epoch 6]:  73%|███████▎  |

[Epoch 6]:  79%|███████▉  | 567/715 [03:37<00:56,  2.61it/s, loss=13.4][A
[Epoch 6]:  79%|███████▉  | 567/715 [03:38<00:56,  2.60it/s, loss=14]  [A
[Epoch 6]:  79%|███████▉  | 568/715 [03:38<00:56,  2.61it/s, loss=14][A
[Epoch 6]:  79%|███████▉  | 568/715 [03:38<00:56,  2.60it/s, loss=13.6][A
[Epoch 6]:  80%|███████▉  | 569/715 [03:38<00:56,  2.61it/s, loss=13.6][A
[Epoch 6]:  80%|███████▉  | 569/715 [03:38<00:56,  2.60it/s, loss=12.5][A
[Epoch 6]:  80%|███████▉  | 570/715 [03:38<00:55,  2.61it/s, loss=12.5][A
[Epoch 6]:  80%|███████▉  | 570/715 [03:39<00:55,  2.60it/s, loss=13.1][A
[Epoch 6]:  80%|███████▉  | 571/715 [03:39<00:55,  2.61it/s, loss=13.1][A
[Epoch 6]:  80%|███████▉  | 571/715 [03:39<00:55,  2.60it/s, loss=13.4][A
[Epoch 6]:  80%|████████  | 572/715 [03:39<00:54,  2.61it/s, loss=13.4][A
[Epoch 6]:  80%|████████  | 572/715 [03:39<00:54,  2.60it/s, loss=14.7][A
[Epoch 6]:  80%|████████  | 573/715 [03:39<00:54,  2.61it/s, loss=14.7][A
[Epoch 6]:  80%|████████  |

[Epoch 6]:  87%|████████▋ | 621/715 [03:58<00:36,  2.60it/s, loss=13.5][A
[Epoch 6]:  87%|████████▋ | 622/715 [03:58<00:35,  2.61it/s, loss=13.5][A
[Epoch 6]:  87%|████████▋ | 622/715 [03:59<00:35,  2.60it/s, loss=12.6][A
[Epoch 6]:  87%|████████▋ | 623/715 [03:59<00:35,  2.61it/s, loss=12.6][A
[Epoch 6]:  87%|████████▋ | 623/715 [03:59<00:35,  2.60it/s, loss=12.7][A
[Epoch 6]:  87%|████████▋ | 624/715 [03:59<00:34,  2.61it/s, loss=12.7][A
[Epoch 6]:  87%|████████▋ | 624/715 [03:59<00:34,  2.60it/s, loss=14.4][A
[Epoch 6]:  87%|████████▋ | 625/715 [03:59<00:34,  2.61it/s, loss=14.4][A
[Epoch 6]:  87%|████████▋ | 625/715 [04:00<00:34,  2.60it/s, loss=14.1][A
[Epoch 6]:  88%|████████▊ | 626/715 [04:00<00:34,  2.61it/s, loss=14.1][A
[Epoch 6]:  88%|████████▊ | 626/715 [04:00<00:34,  2.60it/s, loss=13.5][A
[Epoch 6]:  88%|████████▊ | 627/715 [04:00<00:33,  2.60it/s, loss=13.5][A
[Epoch 6]:  88%|████████▊ | 627/715 [04:01<00:33,  2.60it/s, loss=14.7][A
[Epoch 6]:  88%|████████▊

[Epoch 6]:  95%|█████████▍| 676/715 [04:19<00:14,  2.61it/s, loss=14.1][A
[Epoch 6]:  95%|█████████▍| 676/715 [04:19<00:14,  2.60it/s, loss=12.7][A
[Epoch 6]:  95%|█████████▍| 677/715 [04:19<00:14,  2.61it/s, loss=12.7][A
[Epoch 6]:  95%|█████████▍| 677/715 [04:20<00:14,  2.60it/s, loss=13.4][A
[Epoch 6]:  95%|█████████▍| 678/715 [04:20<00:14,  2.61it/s, loss=13.4][A
[Epoch 6]:  95%|█████████▍| 678/715 [04:20<00:14,  2.60it/s, loss=13.3][A
[Epoch 6]:  95%|█████████▍| 679/715 [04:20<00:13,  2.61it/s, loss=13.3][A
[Epoch 6]:  95%|█████████▍| 679/715 [04:20<00:13,  2.60it/s, loss=14.7][A
[Epoch 6]:  95%|█████████▌| 680/715 [04:20<00:13,  2.61it/s, loss=14.7][A
[Epoch 6]:  95%|█████████▌| 680/715 [04:21<00:13,  2.60it/s, loss=13.8][A
[Epoch 6]:  95%|█████████▌| 681/715 [04:21<00:13,  2.61it/s, loss=13.8][A
[Epoch 6]:  95%|█████████▌| 681/715 [04:21<00:13,  2.60it/s, loss=12.6][A
[Epoch 6]:  95%|█████████▌| 682/715 [04:21<00:12,  2.61it/s, loss=12.6][A
[Epoch 6]:  95%|█████████

[Epoch 7]:   2%|▏         | 15/716 [00:06<04:49,  2.42it/s, loss=14.4][A
[Epoch 7]:   2%|▏         | 15/716 [00:06<05:06,  2.28it/s, loss=13.6][A
[Epoch 7]:   2%|▏         | 16/716 [00:06<04:47,  2.44it/s, loss=13.6][A
[Epoch 7]:   2%|▏         | 16/716 [00:06<05:03,  2.30it/s, loss=13.4][A
[Epoch 7]:   2%|▏         | 17/716 [00:06<04:45,  2.45it/s, loss=13.4][A
[Epoch 7]:   2%|▏         | 17/716 [00:07<05:01,  2.32it/s, loss=14]  [A
[Epoch 7]:   3%|▎         | 18/716 [00:07<04:44,  2.46it/s, loss=14][A
[Epoch 7]:   3%|▎         | 18/716 [00:07<04:58,  2.34it/s, loss=14.8][A
[Epoch 7]:   3%|▎         | 19/716 [00:07<04:42,  2.47it/s, loss=14.8][A
[Epoch 7]:   3%|▎         | 19/716 [00:08<04:56,  2.35it/s, loss=14.2][A
[Epoch 7]:   3%|▎         | 20/716 [00:08<04:41,  2.48it/s, loss=14.2][A
[Epoch 7]:   3%|▎         | 20/716 [00:08<04:54,  2.36it/s, loss=14.2][A
[Epoch 7]:   3%|▎         | 21/716 [00:08<04:40,  2.48it/s, loss=14.2][A
[Epoch 7]:   3%|▎         | 21/716 [00:0

[Epoch 7]:  10%|▉         | 70/716 [00:27<04:10,  2.58it/s, loss=13.3][A
[Epoch 7]:  10%|▉         | 70/716 [00:27<04:14,  2.54it/s, loss=14.1][A
[Epoch 7]:  10%|▉         | 71/716 [00:27<04:10,  2.58it/s, loss=14.1][A
[Epoch 7]:  10%|▉         | 71/716 [00:27<04:13,  2.54it/s, loss=13.7][A
[Epoch 7]:  10%|█         | 72/716 [00:27<04:09,  2.58it/s, loss=13.7][A
[Epoch 7]:  10%|█         | 72/716 [00:28<04:13,  2.54it/s, loss=13.2][A
[Epoch 7]:  10%|█         | 73/716 [00:28<04:09,  2.58it/s, loss=13.2][A
[Epoch 7]:  10%|█         | 73/716 [00:28<04:12,  2.54it/s, loss=12.9][A
[Epoch 7]:  10%|█         | 74/716 [00:28<04:08,  2.58it/s, loss=12.9][A
[Epoch 7]:  10%|█         | 74/716 [00:29<04:12,  2.55it/s, loss=13]  [A
[Epoch 7]:  10%|█         | 75/716 [00:29<04:08,  2.58it/s, loss=13][A
[Epoch 7]:  10%|█         | 75/716 [00:29<04:11,  2.55it/s, loss=13.3][A
[Epoch 7]:  11%|█         | 76/716 [00:29<04:08,  2.58it/s, loss=13.3][A
[Epoch 7]:  11%|█         | 76/716 [00:2

[Epoch 7]:  17%|█▋        | 125/716 [00:48<03:47,  2.60it/s, loss=13.5][A
[Epoch 7]:  17%|█▋        | 125/716 [00:48<03:49,  2.58it/s, loss=13.9][A
[Epoch 7]:  18%|█▊        | 126/716 [00:48<03:47,  2.60it/s, loss=13.9][A
[Epoch 7]:  18%|█▊        | 126/716 [00:48<03:48,  2.58it/s, loss=13.2][A
[Epoch 7]:  18%|█▊        | 127/716 [00:48<03:46,  2.60it/s, loss=13.2][A
[Epoch 7]:  18%|█▊        | 127/716 [00:49<03:48,  2.58it/s, loss=12.7][A
[Epoch 7]:  18%|█▊        | 128/716 [00:49<03:46,  2.60it/s, loss=12.7][A
[Epoch 7]:  18%|█▊        | 128/716 [00:49<03:48,  2.58it/s, loss=13.4][A
[Epoch 7]:  18%|█▊        | 129/716 [00:49<03:45,  2.60it/s, loss=13.4][A
[Epoch 7]:  18%|█▊        | 129/716 [00:50<03:47,  2.58it/s, loss=15]  [A
[Epoch 7]:  18%|█▊        | 130/716 [00:50<03:45,  2.60it/s, loss=15][A
[Epoch 7]:  18%|█▊        | 130/716 [00:50<03:47,  2.58it/s, loss=13.7][A
[Epoch 7]:  18%|█▊        | 131/716 [00:50<03:45,  2.60it/s, loss=13.7][A
[Epoch 7]:  18%|█▊        |

[Epoch 7]:  25%|██▌       | 179/716 [01:09<03:27,  2.59it/s, loss=13.4][A
[Epoch 7]:  25%|██▌       | 180/716 [01:09<03:25,  2.61it/s, loss=13.4][A
[Epoch 7]:  25%|██▌       | 180/716 [01:09<03:26,  2.59it/s, loss=13.2][A
[Epoch 7]:  25%|██▌       | 181/716 [01:09<03:25,  2.61it/s, loss=13.2][A
[Epoch 7]:  25%|██▌       | 181/716 [01:09<03:26,  2.59it/s, loss=13.7][A
[Epoch 7]:  25%|██▌       | 182/716 [01:09<03:24,  2.61it/s, loss=13.7][A
[Epoch 7]:  25%|██▌       | 182/716 [01:10<03:26,  2.59it/s, loss=13.7][A
[Epoch 7]:  26%|██▌       | 183/716 [01:10<03:24,  2.61it/s, loss=13.7][A
[Epoch 7]:  26%|██▌       | 183/716 [01:10<03:25,  2.59it/s, loss=12.3][A
[Epoch 7]:  26%|██▌       | 184/716 [01:10<03:24,  2.61it/s, loss=12.3][A
[Epoch 7]:  26%|██▌       | 184/716 [01:11<03:25,  2.59it/s, loss=13.5][A
[Epoch 7]:  26%|██▌       | 185/716 [01:11<03:23,  2.61it/s, loss=13.5][A
[Epoch 7]:  26%|██▌       | 185/716 [01:11<03:24,  2.59it/s, loss=12.8][A
[Epoch 7]:  26%|██▌      

[Epoch 7]:  33%|███▎      | 234/716 [01:29<03:04,  2.61it/s, loss=14.4][A
[Epoch 7]:  33%|███▎      | 234/716 [01:30<03:05,  2.60it/s, loss=14.3][A
[Epoch 7]:  33%|███▎      | 235/716 [01:30<03:04,  2.61it/s, loss=14.3][A
[Epoch 7]:  33%|███▎      | 235/716 [01:30<03:05,  2.60it/s, loss=13.3][A
[Epoch 7]:  33%|███▎      | 236/716 [01:30<03:04,  2.61it/s, loss=13.3][A
[Epoch 7]:  33%|███▎      | 236/716 [01:30<03:04,  2.60it/s, loss=14]  [A
[Epoch 7]:  33%|███▎      | 237/716 [01:30<03:03,  2.61it/s, loss=14][A
[Epoch 7]:  33%|███▎      | 237/716 [01:31<03:04,  2.60it/s, loss=15.1][A
[Epoch 7]:  33%|███▎      | 238/716 [01:31<03:03,  2.61it/s, loss=15.1][A
[Epoch 7]:  33%|███▎      | 238/716 [01:31<03:04,  2.60it/s, loss=14.4][A
[Epoch 7]:  33%|███▎      | 239/716 [01:31<03:02,  2.61it/s, loss=14.4][A
[Epoch 7]:  33%|███▎      | 239/716 [01:32<03:03,  2.60it/s, loss=13.6][A
[Epoch 7]:  34%|███▎      | 240/716 [01:32<03:02,  2.61it/s, loss=13.6][A
[Epoch 7]:  34%|███▎      |

[Epoch 7]:  40%|████      | 288/716 [01:50<02:44,  2.60it/s, loss=13]  [A
[Epoch 7]:  40%|████      | 289/716 [01:50<02:43,  2.61it/s, loss=13][A
[Epoch 7]:  40%|████      | 289/716 [01:51<02:44,  2.60it/s, loss=14.4][A
[Epoch 7]:  41%|████      | 290/716 [01:51<02:43,  2.61it/s, loss=14.4][A
[Epoch 7]:  41%|████      | 290/716 [01:51<02:43,  2.60it/s, loss=13.9][A
[Epoch 7]:  41%|████      | 291/716 [01:51<02:42,  2.61it/s, loss=13.9][A
[Epoch 7]:  41%|████      | 291/716 [01:51<02:43,  2.60it/s, loss=13.9][A
[Epoch 7]:  41%|████      | 292/716 [01:51<02:42,  2.61it/s, loss=13.9][A
[Epoch 7]:  41%|████      | 292/716 [01:52<02:43,  2.60it/s, loss=14]  [A
[Epoch 7]:  41%|████      | 293/716 [01:52<02:42,  2.61it/s, loss=14][A
[Epoch 7]:  41%|████      | 293/716 [01:52<02:42,  2.60it/s, loss=13.3][A
[Epoch 7]:  41%|████      | 294/716 [01:52<02:41,  2.61it/s, loss=13.3][A
[Epoch 7]:  41%|████      | 294/716 [01:53<02:42,  2.60it/s, loss=15]  [A
[Epoch 7]:  41%|████      | 2

[Epoch 7]:  48%|████▊     | 343/716 [02:11<02:22,  2.61it/s, loss=14.4][A
[Epoch 7]:  48%|████▊     | 343/716 [02:11<02:23,  2.60it/s, loss=13.7][A
[Epoch 7]:  48%|████▊     | 344/716 [02:11<02:22,  2.61it/s, loss=13.7][A
[Epoch 7]:  48%|████▊     | 344/716 [02:12<02:22,  2.60it/s, loss=14.3][A
[Epoch 7]:  48%|████▊     | 345/716 [02:12<02:22,  2.61it/s, loss=14.3][A
[Epoch 7]:  48%|████▊     | 345/716 [02:12<02:22,  2.60it/s, loss=14]  [A
[Epoch 7]:  48%|████▊     | 346/716 [02:12<02:21,  2.61it/s, loss=14][A
[Epoch 7]:  48%|████▊     | 346/716 [02:12<02:22,  2.60it/s, loss=14.2][A
[Epoch 7]:  48%|████▊     | 347/716 [02:12<02:21,  2.61it/s, loss=14.2][A
[Epoch 7]:  48%|████▊     | 347/716 [02:13<02:21,  2.60it/s, loss=12.8][A
[Epoch 7]:  49%|████▊     | 348/716 [02:13<02:21,  2.61it/s, loss=12.8][A
[Epoch 7]:  49%|████▊     | 348/716 [02:13<02:21,  2.60it/s, loss=14.1][A
[Epoch 7]:  49%|████▊     | 349/716 [02:13<02:20,  2.61it/s, loss=14.1][A
[Epoch 7]:  49%|████▊     |

[Epoch 7]:  55%|█████▌    | 397/716 [02:32<02:02,  2.60it/s, loss=14.6][A
[Epoch 7]:  56%|█████▌    | 398/716 [02:32<02:01,  2.61it/s, loss=14.6][A
[Epoch 7]:  56%|█████▌    | 398/716 [02:33<02:02,  2.60it/s, loss=14.2][A
[Epoch 7]:  56%|█████▌    | 399/716 [02:33<02:01,  2.61it/s, loss=14.2][A
[Epoch 7]:  56%|█████▌    | 399/716 [02:33<02:01,  2.60it/s, loss=13.9][A
[Epoch 7]:  56%|█████▌    | 400/716 [02:33<02:01,  2.61it/s, loss=13.9][A
[Epoch 7]:  56%|█████▌    | 400/716 [02:33<02:01,  2.60it/s, loss=13.3][A
[Epoch 7]:  56%|█████▌    | 401/716 [02:33<02:00,  2.61it/s, loss=13.3][A
[Epoch 7]:  56%|█████▌    | 401/716 [02:34<02:01,  2.60it/s, loss=14.2][A
[Epoch 7]:  56%|█████▌    | 402/716 [02:34<02:00,  2.61it/s, loss=14.2][A
[Epoch 7]:  56%|█████▌    | 402/716 [02:34<02:00,  2.60it/s, loss=14.6][A
[Epoch 7]:  56%|█████▋    | 403/716 [02:34<02:00,  2.61it/s, loss=14.6][A
[Epoch 7]:  56%|█████▋    | 403/716 [02:34<02:00,  2.60it/s, loss=14.3][A
[Epoch 7]:  56%|█████▋   

[Epoch 7]:  63%|██████▎   | 452/716 [02:53<01:41,  2.61it/s, loss=14][A
[Epoch 7]:  63%|██████▎   | 452/716 [02:53<01:41,  2.60it/s, loss=13.6][A
[Epoch 7]:  63%|██████▎   | 453/716 [02:53<01:40,  2.61it/s, loss=13.6][A
[Epoch 7]:  63%|██████▎   | 453/716 [02:54<01:41,  2.60it/s, loss=13.2][A
[Epoch 7]:  63%|██████▎   | 454/716 [02:54<01:40,  2.61it/s, loss=13.2][A
[Epoch 7]:  63%|██████▎   | 454/716 [02:54<01:40,  2.60it/s, loss=14.6][A
[Epoch 7]:  64%|██████▎   | 455/716 [02:54<01:40,  2.61it/s, loss=14.6][A
[Epoch 7]:  64%|██████▎   | 455/716 [02:55<01:40,  2.60it/s, loss=12.8][A
[Epoch 7]:  64%|██████▎   | 456/716 [02:55<01:39,  2.61it/s, loss=12.8][A
[Epoch 7]:  64%|██████▎   | 456/716 [02:55<01:40,  2.60it/s, loss=14.7][A
[Epoch 7]:  64%|██████▍   | 457/716 [02:55<01:39,  2.61it/s, loss=14.7][A
[Epoch 7]:  64%|██████▍   | 457/716 [02:55<01:39,  2.60it/s, loss=14.2][A
[Epoch 7]:  64%|██████▍   | 458/716 [02:55<01:39,  2.61it/s, loss=14.2][A
[Epoch 7]:  64%|██████▍   |

[Epoch 7]:  71%|███████   | 506/716 [03:14<01:20,  2.60it/s, loss=13.6][A
[Epoch 7]:  71%|███████   | 507/716 [03:14<01:20,  2.61it/s, loss=13.6][A
[Epoch 7]:  71%|███████   | 507/716 [03:14<01:20,  2.60it/s, loss=14.5][A
[Epoch 7]:  71%|███████   | 508/716 [03:14<01:19,  2.61it/s, loss=14.5][A
[Epoch 7]:  71%|███████   | 508/716 [03:15<01:19,  2.60it/s, loss=13.3][A
[Epoch 7]:  71%|███████   | 509/716 [03:15<01:19,  2.61it/s, loss=13.3][A
[Epoch 7]:  71%|███████   | 509/716 [03:15<01:19,  2.60it/s, loss=14]  [A
[Epoch 7]:  71%|███████   | 510/716 [03:15<01:19,  2.61it/s, loss=14][A
[Epoch 7]:  71%|███████   | 510/716 [03:16<01:19,  2.60it/s, loss=13.1][A
[Epoch 7]:  71%|███████▏  | 511/716 [03:16<01:18,  2.61it/s, loss=13.1][A
[Epoch 7]:  71%|███████▏  | 511/716 [03:16<01:18,  2.60it/s, loss=13.2][A
[Epoch 7]:  72%|███████▏  | 512/716 [03:16<01:18,  2.61it/s, loss=13.2][A
[Epoch 7]:  72%|███████▏  | 512/716 [03:16<01:18,  2.60it/s, loss=13.5][A
[Epoch 7]:  72%|███████▏  |

[Epoch 7]:  78%|███████▊  | 561/716 [03:35<00:59,  2.61it/s, loss=13.4][A
[Epoch 7]:  78%|███████▊  | 561/716 [03:35<00:59,  2.60it/s, loss=14.6][A
[Epoch 7]:  78%|███████▊  | 562/716 [03:35<00:59,  2.61it/s, loss=14.6][A
[Epoch 7]:  78%|███████▊  | 562/716 [03:36<00:59,  2.60it/s, loss=13.4][A
[Epoch 7]:  79%|███████▊  | 563/716 [03:36<00:58,  2.61it/s, loss=13.4][A
[Epoch 7]:  79%|███████▊  | 563/716 [03:36<00:58,  2.60it/s, loss=12.4][A
[Epoch 7]:  79%|███████▉  | 564/716 [03:36<00:58,  2.61it/s, loss=12.4][A
[Epoch 7]:  79%|███████▉  | 564/716 [03:36<00:58,  2.60it/s, loss=14]  [A
[Epoch 7]:  79%|███████▉  | 565/716 [03:36<00:57,  2.61it/s, loss=14][A
[Epoch 7]:  79%|███████▉  | 565/716 [03:37<00:58,  2.60it/s, loss=13.3][A
[Epoch 7]:  79%|███████▉  | 566/716 [03:37<00:57,  2.61it/s, loss=13.3][A
[Epoch 7]:  79%|███████▉  | 566/716 [03:37<00:57,  2.60it/s, loss=13.8][A
[Epoch 7]:  79%|███████▉  | 567/716 [03:37<00:57,  2.61it/s, loss=13.8][A
[Epoch 7]:  79%|███████▉  |

[Epoch 7]:  86%|████████▌ | 615/716 [03:56<00:38,  2.60it/s, loss=14.1][A
[Epoch 7]:  86%|████████▌ | 616/716 [03:56<00:38,  2.61it/s, loss=14.1][A
[Epoch 7]:  86%|████████▌ | 616/716 [03:56<00:38,  2.60it/s, loss=13.7][A
[Epoch 7]:  86%|████████▌ | 617/716 [03:56<00:37,  2.61it/s, loss=13.7][A
[Epoch 7]:  86%|████████▌ | 617/716 [03:57<00:38,  2.60it/s, loss=12.4][A
[Epoch 7]:  86%|████████▋ | 618/716 [03:57<00:37,  2.61it/s, loss=12.4][A
[Epoch 7]:  86%|████████▋ | 618/716 [03:57<00:37,  2.60it/s, loss=13.2][A
[Epoch 7]:  86%|████████▋ | 619/716 [03:57<00:37,  2.61it/s, loss=13.2][A
[Epoch 7]:  86%|████████▋ | 619/716 [03:57<00:37,  2.60it/s, loss=14.6][A
[Epoch 7]:  87%|████████▋ | 620/716 [03:57<00:36,  2.61it/s, loss=14.6][A
[Epoch 7]:  87%|████████▋ | 620/716 [03:58<00:36,  2.60it/s, loss=13.5][A
[Epoch 7]:  87%|████████▋ | 621/716 [03:58<00:36,  2.61it/s, loss=13.5][A
[Epoch 7]:  87%|████████▋ | 621/716 [03:58<00:36,  2.60it/s, loss=14.9][A
[Epoch 7]:  87%|████████▋

[Epoch 7]:  94%|█████████▎| 670/716 [04:17<00:17,  2.61it/s, loss=14.2][A
[Epoch 7]:  94%|█████████▎| 670/716 [04:17<00:17,  2.60it/s, loss=12.9][A
[Epoch 7]:  94%|█████████▎| 671/716 [04:17<00:17,  2.61it/s, loss=12.9][A
[Epoch 7]:  94%|█████████▎| 671/716 [04:17<00:17,  2.60it/s, loss=13.2][A
[Epoch 7]:  94%|█████████▍| 672/716 [04:17<00:16,  2.61it/s, loss=13.2][A
[Epoch 7]:  94%|█████████▍| 672/716 [04:18<00:16,  2.60it/s, loss=12.5][A
[Epoch 7]:  94%|█████████▍| 673/716 [04:18<00:16,  2.61it/s, loss=12.5][A
[Epoch 7]:  94%|█████████▍| 673/716 [04:18<00:16,  2.60it/s, loss=13.3][A
[Epoch 7]:  94%|█████████▍| 674/716 [04:18<00:16,  2.61it/s, loss=13.3][A
[Epoch 7]:  94%|█████████▍| 674/716 [04:19<00:16,  2.60it/s, loss=13]  [A
[Epoch 7]:  94%|█████████▍| 675/716 [04:19<00:15,  2.61it/s, loss=13][A
[Epoch 7]:  94%|█████████▍| 675/716 [04:19<00:15,  2.60it/s, loss=13.3][A
[Epoch 7]:  94%|█████████▍| 676/716 [04:19<00:15,  2.61it/s, loss=13.3][A
[Epoch 7]:  94%|█████████▍|

[Epoch 8]:   1%|          | 8/716 [00:03<05:07,  2.30it/s, loss=12.4][A
[Epoch 8]:   1%|          | 8/716 [00:03<05:41,  2.07it/s, loss=14]  [A
[Epoch 8]:   1%|▏         | 9/716 [00:03<05:03,  2.33it/s, loss=14][A
[Epoch 8]:   1%|▏         | 9/716 [00:04<05:34,  2.12it/s, loss=13.3][A
[Epoch 8]:   1%|▏         | 10/716 [00:04<05:00,  2.35it/s, loss=13.3][A
[Epoch 8]:   1%|▏         | 10/716 [00:04<05:28,  2.15it/s, loss=14]  [A
[Epoch 8]:   2%|▏         | 11/716 [00:04<04:58,  2.36it/s, loss=14][A
[Epoch 8]:   2%|▏         | 11/716 [00:05<05:22,  2.18it/s, loss=15.6][A
[Epoch 8]:   2%|▏         | 12/716 [00:05<04:55,  2.38it/s, loss=15.6][A
[Epoch 8]:   2%|▏         | 12/716 [00:05<05:18,  2.21it/s, loss=13.5][A
[Epoch 8]:   2%|▏         | 13/716 [00:05<04:53,  2.39it/s, loss=13.5][A
[Epoch 8]:   2%|▏         | 13/716 [00:05<05:14,  2.24it/s, loss=14.5][A
[Epoch 8]:   2%|▏         | 14/716 [00:05<04:51,  2.41it/s, loss=14.5][A
[Epoch 8]:   2%|▏         | 14/716 [00:06<05:1

[Epoch 8]:   9%|▉         | 63/716 [00:24<04:15,  2.56it/s, loss=13.8][A
[Epoch 8]:   9%|▉         | 63/716 [00:24<04:18,  2.52it/s, loss=14.4][A
[Epoch 8]:   9%|▉         | 64/716 [00:24<04:14,  2.56it/s, loss=14.4][A
[Epoch 8]:   9%|▉         | 64/716 [00:25<04:18,  2.52it/s, loss=13.4][A
[Epoch 8]:   9%|▉         | 65/716 [00:25<04:14,  2.56it/s, loss=13.4][A
[Epoch 8]:   9%|▉         | 65/716 [00:25<04:17,  2.53it/s, loss=13.2][A
[Epoch 8]:   9%|▉         | 66/716 [00:25<04:13,  2.56it/s, loss=13.2][A
[Epoch 8]:   9%|▉         | 66/716 [00:26<04:17,  2.53it/s, loss=13.8][A
[Epoch 8]:   9%|▉         | 67/716 [00:26<04:13,  2.56it/s, loss=13.8][A
[Epoch 8]:   9%|▉         | 67/716 [00:26<04:16,  2.53it/s, loss=14]  [A
[Epoch 8]:   9%|▉         | 68/716 [00:26<04:12,  2.57it/s, loss=14][A
[Epoch 8]:   9%|▉         | 68/716 [00:26<04:16,  2.53it/s, loss=14.4][A
[Epoch 8]:  10%|▉         | 69/716 [00:26<04:12,  2.57it/s, loss=14.4][A
[Epoch 8]:  10%|▉         | 69/716 [00:2

[Epoch 8]:  16%|█▋        | 118/716 [00:45<03:51,  2.58it/s, loss=14][A
[Epoch 8]:  16%|█▋        | 118/716 [00:46<03:53,  2.56it/s, loss=13.7][A
[Epoch 8]:  17%|█▋        | 119/716 [00:46<03:51,  2.58it/s, loss=13.7][A
[Epoch 8]:  17%|█▋        | 119/716 [00:46<03:52,  2.56it/s, loss=13.4][A
[Epoch 8]:  17%|█▋        | 120/716 [00:46<03:50,  2.58it/s, loss=13.4][A
[Epoch 8]:  17%|█▋        | 120/716 [00:46<03:52,  2.56it/s, loss=13.5][A
[Epoch 8]:  17%|█▋        | 121/716 [00:46<03:50,  2.58it/s, loss=13.5][A
[Epoch 8]:  17%|█▋        | 121/716 [00:47<03:52,  2.56it/s, loss=13.5][A
[Epoch 8]:  17%|█▋        | 122/716 [00:47<03:49,  2.58it/s, loss=13.5][A
[Epoch 8]:  17%|█▋        | 122/716 [00:47<03:51,  2.56it/s, loss=13.6][A
[Epoch 8]:  17%|█▋        | 123/716 [00:47<03:49,  2.59it/s, loss=13.6][A
[Epoch 8]:  17%|█▋        | 123/716 [00:47<03:51,  2.56it/s, loss=14]  [A
[Epoch 8]:  17%|█▋        | 124/716 [00:47<03:48,  2.59it/s, loss=14][A
[Epoch 8]:  17%|█▋        | 1

[Epoch 8]:  24%|██▍       | 172/716 [01:06<03:30,  2.58it/s, loss=12.3][A
[Epoch 8]:  24%|██▍       | 173/716 [01:06<03:29,  2.59it/s, loss=12.3][A
[Epoch 8]:  24%|██▍       | 173/716 [01:07<03:30,  2.58it/s, loss=14.2][A
[Epoch 8]:  24%|██▍       | 174/716 [01:07<03:28,  2.59it/s, loss=14.2][A
[Epoch 8]:  24%|██▍       | 174/716 [01:07<03:30,  2.58it/s, loss=13.7][A
[Epoch 8]:  24%|██▍       | 175/716 [01:07<03:28,  2.59it/s, loss=13.7][A
[Epoch 8]:  24%|██▍       | 175/716 [01:07<03:29,  2.58it/s, loss=12.8][A
[Epoch 8]:  25%|██▍       | 176/716 [01:07<03:28,  2.59it/s, loss=12.8][A
[Epoch 8]:  25%|██▍       | 176/716 [01:08<03:29,  2.58it/s, loss=12.4][A
[Epoch 8]:  25%|██▍       | 177/716 [01:08<03:27,  2.59it/s, loss=12.4][A
[Epoch 8]:  25%|██▍       | 177/716 [01:08<03:28,  2.58it/s, loss=13]  [A
[Epoch 8]:  25%|██▍       | 178/716 [01:08<03:27,  2.59it/s, loss=13][A
[Epoch 8]:  25%|██▍       | 178/716 [01:08<03:28,  2.58it/s, loss=14.4][A
[Epoch 8]:  25%|██▌       |

[Epoch 8]:  32%|███▏      | 227/716 [01:27<03:08,  2.60it/s, loss=13.2][A
[Epoch 8]:  32%|███▏      | 227/716 [01:27<03:09,  2.59it/s, loss=13.6][A
[Epoch 8]:  32%|███▏      | 228/716 [01:27<03:07,  2.60it/s, loss=13.6][A
[Epoch 8]:  32%|███▏      | 228/716 [01:28<03:08,  2.59it/s, loss=14.4][A
[Epoch 8]:  32%|███▏      | 229/716 [01:28<03:07,  2.60it/s, loss=14.4][A
[Epoch 8]:  32%|███▏      | 229/716 [01:28<03:08,  2.59it/s, loss=13.9][A
[Epoch 8]:  32%|███▏      | 230/716 [01:28<03:07,  2.60it/s, loss=13.9][A
[Epoch 8]:  32%|███▏      | 230/716 [01:28<03:07,  2.59it/s, loss=13.2][A
[Epoch 8]:  32%|███▏      | 231/716 [01:28<03:06,  2.60it/s, loss=13.2][A
[Epoch 8]:  32%|███▏      | 231/716 [01:29<03:07,  2.59it/s, loss=12.9][A
[Epoch 8]:  32%|███▏      | 232/716 [01:29<03:06,  2.60it/s, loss=12.9][A
[Epoch 8]:  32%|███▏      | 232/716 [01:29<03:07,  2.59it/s, loss=13.8][A
[Epoch 8]:  33%|███▎      | 233/716 [01:29<03:05,  2.60it/s, loss=13.8][A
[Epoch 8]:  33%|███▎     

[Epoch 8]:  39%|███▉      | 281/716 [01:48<02:47,  2.59it/s, loss=13.4][A
[Epoch 8]:  39%|███▉      | 282/716 [01:48<02:46,  2.60it/s, loss=13.4][A
[Epoch 8]:  39%|███▉      | 282/716 [01:48<02:47,  2.59it/s, loss=13.5][A
[Epoch 8]:  40%|███▉      | 283/716 [01:48<02:46,  2.60it/s, loss=13.5][A
[Epoch 8]:  40%|███▉      | 283/716 [01:49<02:47,  2.59it/s, loss=15.1][A
[Epoch 8]:  40%|███▉      | 284/716 [01:49<02:46,  2.60it/s, loss=15.1][A
[Epoch 8]:  40%|███▉      | 284/716 [01:49<02:46,  2.59it/s, loss=13.6][A
[Epoch 8]:  40%|███▉      | 285/716 [01:49<02:45,  2.60it/s, loss=13.6][A
[Epoch 8]:  40%|███▉      | 285/716 [01:50<02:46,  2.59it/s, loss=12.9][A
[Epoch 8]:  40%|███▉      | 286/716 [01:50<02:45,  2.60it/s, loss=12.9][A
[Epoch 8]:  40%|███▉      | 286/716 [01:50<02:45,  2.59it/s, loss=13.7][A
[Epoch 8]:  40%|████      | 287/716 [01:50<02:45,  2.60it/s, loss=13.7][A
[Epoch 8]:  40%|████      | 287/716 [01:50<02:45,  2.59it/s, loss=12.7][A
[Epoch 8]:  40%|████     

[Epoch 8]:  47%|████▋     | 336/716 [02:09<02:26,  2.60it/s, loss=14.3][A
[Epoch 8]:  47%|████▋     | 336/716 [02:09<02:26,  2.59it/s, loss=13.9][A
[Epoch 8]:  47%|████▋     | 337/716 [02:09<02:25,  2.60it/s, loss=13.9][A
[Epoch 8]:  47%|████▋     | 337/716 [02:09<02:26,  2.59it/s, loss=12.6][A
[Epoch 8]:  47%|████▋     | 338/716 [02:09<02:25,  2.60it/s, loss=12.6][A
[Epoch 8]:  47%|████▋     | 338/716 [02:10<02:25,  2.59it/s, loss=13.1][A
[Epoch 8]:  47%|████▋     | 339/716 [02:10<02:24,  2.60it/s, loss=13.1][A
[Epoch 8]:  47%|████▋     | 339/716 [02:10<02:25,  2.59it/s, loss=13.4][A
[Epoch 8]:  47%|████▋     | 340/716 [02:10<02:24,  2.60it/s, loss=13.4][A
[Epoch 8]:  47%|████▋     | 340/716 [02:11<02:24,  2.59it/s, loss=14]  [A
[Epoch 8]:  48%|████▊     | 341/716 [02:11<02:24,  2.60it/s, loss=14][A
[Epoch 8]:  48%|████▊     | 341/716 [02:11<02:24,  2.59it/s, loss=13.5][A
[Epoch 8]:  48%|████▊     | 342/716 [02:11<02:23,  2.60it/s, loss=13.5][A
[Epoch 8]:  48%|████▊     |

[Epoch 8]:  54%|█████▍    | 390/716 [02:30<02:05,  2.60it/s, loss=12.3][A
[Epoch 8]:  55%|█████▍    | 391/716 [02:30<02:04,  2.60it/s, loss=12.3][A
[Epoch 8]:  55%|█████▍    | 391/716 [02:30<02:05,  2.60it/s, loss=14.5][A
[Epoch 8]:  55%|█████▍    | 392/716 [02:30<02:04,  2.60it/s, loss=14.5][A
[Epoch 8]:  55%|█████▍    | 392/716 [02:30<02:04,  2.60it/s, loss=13.3][A
[Epoch 8]:  55%|█████▍    | 393/716 [02:30<02:04,  2.60it/s, loss=13.3][A
[Epoch 8]:  55%|█████▍    | 393/716 [02:31<02:04,  2.60it/s, loss=13]  [A
[Epoch 8]:  55%|█████▌    | 394/716 [02:31<02:03,  2.60it/s, loss=13][A
[Epoch 8]:  55%|█████▌    | 394/716 [02:31<02:04,  2.60it/s, loss=13.2][A
[Epoch 8]:  55%|█████▌    | 395/716 [02:31<02:03,  2.60it/s, loss=13.2][A
[Epoch 8]:  55%|█████▌    | 395/716 [02:32<02:03,  2.60it/s, loss=14.2][A
[Epoch 8]:  55%|█████▌    | 396/716 [02:32<02:02,  2.60it/s, loss=14.2][A
[Epoch 8]:  55%|█████▌    | 396/716 [02:32<02:03,  2.60it/s, loss=13]  [A
[Epoch 8]:  55%|█████▌    |

[Epoch 8]:  62%|██████▏   | 445/716 [02:50<01:44,  2.60it/s, loss=11.8][A
[Epoch 8]:  62%|██████▏   | 445/716 [02:51<01:44,  2.60it/s, loss=13.5][A
[Epoch 8]:  62%|██████▏   | 446/716 [02:51<01:43,  2.60it/s, loss=13.5][A
[Epoch 8]:  62%|██████▏   | 446/716 [02:51<01:43,  2.60it/s, loss=13.1][A
[Epoch 8]:  62%|██████▏   | 447/716 [02:51<01:43,  2.60it/s, loss=13.1][A
[Epoch 8]:  62%|██████▏   | 447/716 [02:51<01:43,  2.60it/s, loss=13]  [A
[Epoch 8]:  63%|██████▎   | 448/716 [02:52<01:42,  2.60it/s, loss=13][A
[Epoch 8]:  63%|██████▎   | 448/716 [02:52<01:43,  2.60it/s, loss=13.7][A
[Epoch 8]:  63%|██████▎   | 449/716 [02:52<01:42,  2.60it/s, loss=13.7][A
[Epoch 8]:  63%|██████▎   | 449/716 [02:52<01:42,  2.60it/s, loss=13]  [A
[Epoch 8]:  63%|██████▎   | 450/716 [02:52<01:42,  2.60it/s, loss=13][A
[Epoch 8]:  63%|██████▎   | 450/716 [02:53<01:42,  2.60it/s, loss=12.3][A
[Epoch 8]:  63%|██████▎   | 451/716 [02:53<01:41,  2.60it/s, loss=12.3][A
[Epoch 8]:  63%|██████▎   | 4

[Epoch 8]:  70%|██████▉   | 499/716 [03:11<01:23,  2.60it/s, loss=11.6][A
[Epoch 8]:  70%|██████▉   | 500/716 [03:11<01:22,  2.61it/s, loss=11.6][A
[Epoch 8]:  70%|██████▉   | 500/716 [03:12<01:23,  2.60it/s, loss=13.1][A
[Epoch 8]:  70%|██████▉   | 501/716 [03:12<01:22,  2.61it/s, loss=13.1][A
[Epoch 8]:  70%|██████▉   | 501/716 [03:12<01:22,  2.60it/s, loss=13.8][A
[Epoch 8]:  70%|███████   | 502/716 [03:12<01:22,  2.61it/s, loss=13.8][A
[Epoch 8]:  70%|███████   | 502/716 [03:12<01:22,  2.60it/s, loss=13]  [A
[Epoch 8]:  70%|███████   | 503/716 [03:12<01:21,  2.61it/s, loss=13][A
[Epoch 8]:  70%|███████   | 503/716 [03:13<01:21,  2.60it/s, loss=12.3][A
[Epoch 8]:  70%|███████   | 504/716 [03:13<01:21,  2.61it/s, loss=12.3][A
[Epoch 8]:  70%|███████   | 504/716 [03:13<01:21,  2.60it/s, loss=13.2][A
[Epoch 8]:  71%|███████   | 505/716 [03:13<01:20,  2.61it/s, loss=13.2][A
[Epoch 8]:  71%|███████   | 505/716 [03:14<01:21,  2.60it/s, loss=13.7][A
[Epoch 8]:  71%|███████   |

[Epoch 8]:  77%|███████▋  | 554/716 [03:32<01:02,  2.61it/s, loss=13][A
[Epoch 8]:  77%|███████▋  | 554/716 [03:32<01:02,  2.60it/s, loss=13.1][A
[Epoch 8]:  78%|███████▊  | 555/716 [03:32<01:01,  2.61it/s, loss=13.1][A
[Epoch 8]:  78%|███████▊  | 555/716 [03:33<01:01,  2.60it/s, loss=14.3][A
[Epoch 8]:  78%|███████▊  | 556/716 [03:33<01:01,  2.61it/s, loss=14.3][A
[Epoch 8]:  78%|███████▊  | 556/716 [03:33<01:01,  2.60it/s, loss=12.3][A
[Epoch 8]:  78%|███████▊  | 557/716 [03:33<01:00,  2.61it/s, loss=12.3][A
[Epoch 8]:  78%|███████▊  | 557/716 [03:33<01:01,  2.60it/s, loss=13.7][A
[Epoch 8]:  78%|███████▊  | 558/716 [03:33<01:00,  2.61it/s, loss=13.7][A
[Epoch 8]:  78%|███████▊  | 558/716 [03:34<01:00,  2.60it/s, loss=13.6][A
[Epoch 8]:  78%|███████▊  | 559/716 [03:34<01:00,  2.61it/s, loss=13.6][A
[Epoch 8]:  78%|███████▊  | 559/716 [03:34<01:00,  2.60it/s, loss=14.4][A
[Epoch 8]:  78%|███████▊  | 560/716 [03:34<00:59,  2.61it/s, loss=14.4][A
[Epoch 8]:  78%|███████▊  |

[Epoch 8]:  85%|████████▍ | 608/716 [03:53<00:41,  2.60it/s, loss=13.9][A
[Epoch 8]:  85%|████████▌ | 609/716 [03:53<00:41,  2.61it/s, loss=13.9][A
[Epoch 8]:  85%|████████▌ | 609/716 [03:53<00:41,  2.60it/s, loss=12.6][A
[Epoch 8]:  85%|████████▌ | 610/716 [03:53<00:40,  2.61it/s, loss=12.6][A
[Epoch 8]:  85%|████████▌ | 610/716 [03:54<00:40,  2.60it/s, loss=15.3][A
[Epoch 8]:  85%|████████▌ | 611/716 [03:54<00:40,  2.61it/s, loss=15.3][A
[Epoch 8]:  85%|████████▌ | 611/716 [03:54<00:40,  2.60it/s, loss=13.5][A
[Epoch 8]:  85%|████████▌ | 612/716 [03:54<00:39,  2.61it/s, loss=13.5][A
[Epoch 8]:  85%|████████▌ | 612/716 [03:55<00:39,  2.60it/s, loss=14.2][A
[Epoch 8]:  86%|████████▌ | 613/716 [03:55<00:39,  2.61it/s, loss=14.2][A
[Epoch 8]:  86%|████████▌ | 613/716 [03:55<00:39,  2.60it/s, loss=14]  [A
[Epoch 8]:  86%|████████▌ | 614/716 [03:55<00:39,  2.61it/s, loss=14][A
[Epoch 8]:  86%|████████▌ | 614/716 [03:55<00:39,  2.60it/s, loss=12.3][A
[Epoch 8]:  86%|████████▌ |

[Epoch 8]:  93%|█████████▎| 663/716 [04:14<00:20,  2.61it/s, loss=13.7][A
[Epoch 8]:  93%|█████████▎| 663/716 [04:14<00:20,  2.60it/s, loss=14.6][A
[Epoch 8]:  93%|█████████▎| 664/716 [04:14<00:19,  2.61it/s, loss=14.6][A
[Epoch 8]:  93%|█████████▎| 664/716 [04:15<00:19,  2.60it/s, loss=12.8][A
[Epoch 8]:  93%|█████████▎| 665/716 [04:15<00:19,  2.61it/s, loss=12.8][A
[Epoch 8]:  93%|█████████▎| 665/716 [04:15<00:19,  2.60it/s, loss=15.1][A
[Epoch 8]:  93%|█████████▎| 666/716 [04:15<00:19,  2.61it/s, loss=15.1][A
[Epoch 8]:  93%|█████████▎| 666/716 [04:15<00:19,  2.60it/s, loss=13.6][A
[Epoch 8]:  93%|█████████▎| 667/716 [04:15<00:18,  2.61it/s, loss=13.6][A
[Epoch 8]:  93%|█████████▎| 667/716 [04:16<00:18,  2.60it/s, loss=14.2][A
[Epoch 8]:  93%|█████████▎| 668/716 [04:16<00:18,  2.61it/s, loss=14.2][A
[Epoch 8]:  93%|█████████▎| 668/716 [04:16<00:18,  2.60it/s, loss=12.6][A
[Epoch 8]:  93%|█████████▎| 669/716 [04:16<00:18,  2.61it/s, loss=12.6][A
[Epoch 8]:  93%|█████████

[Epoch 9]:   0%|          | 1/716 [00:00<09:26,  1.26it/s, loss=13.7][A
[Epoch 9]:   0%|          | 1/716 [00:01<14:07,  1.19s/it, loss=13]  [A
[Epoch 9]:   0%|          | 2/716 [00:01<07:06,  1.68it/s, loss=13][A
[Epoch 9]:   0%|          | 2/716 [00:01<09:24,  1.26it/s, loss=14.4][A
[Epoch 9]:   0%|          | 3/716 [00:01<06:17,  1.89it/s, loss=14.4][A
[Epoch 9]:   0%|          | 3/716 [00:01<07:53,  1.51it/s, loss=14.2][A
[Epoch 9]:   1%|          | 4/716 [00:01<05:55,  2.00it/s, loss=14.2][A
[Epoch 9]:   1%|          | 4/716 [00:02<07:07,  1.66it/s, loss=13.4][A
[Epoch 9]:   1%|          | 5/716 [00:02<05:42,  2.08it/s, loss=13.4][A
[Epoch 9]:   1%|          | 5/716 [00:02<06:36,  1.79it/s, loss=13.2][A
[Epoch 9]:   1%|          | 6/716 [00:02<05:30,  2.15it/s, loss=13.2][A
[Epoch 9]:   1%|          | 6/716 [00:03<06:15,  1.89it/s, loss=13.2][A
[Epoch 9]:   1%|          | 7/716 [00:03<05:22,  2.20it/s, loss=13.2][A
[Epoch 9]:   1%|          | 7/716 [00:03<06:00,  1.97

[Epoch 9]:   8%|▊         | 56/716 [00:22<04:24,  2.49it/s, loss=14.1][A
[Epoch 9]:   8%|▊         | 57/716 [00:22<04:19,  2.54it/s, loss=14.1][A
[Epoch 9]:   8%|▊         | 57/716 [00:22<04:23,  2.50it/s, loss=12.2][A
[Epoch 9]:   8%|▊         | 58/716 [00:22<04:19,  2.54it/s, loss=12.2][A
[Epoch 9]:   8%|▊         | 58/716 [00:23<04:23,  2.50it/s, loss=13.8][A
[Epoch 9]:   8%|▊         | 59/716 [00:23<04:18,  2.54it/s, loss=13.8][A
[Epoch 9]:   8%|▊         | 59/716 [00:23<04:22,  2.50it/s, loss=12.5][A
[Epoch 9]:   8%|▊         | 60/716 [00:23<04:17,  2.54it/s, loss=12.5][A
[Epoch 9]:   8%|▊         | 60/716 [00:23<04:22,  2.50it/s, loss=13.6][A
[Epoch 9]:   9%|▊         | 61/716 [00:23<04:17,  2.55it/s, loss=13.6][A
[Epoch 9]:   9%|▊         | 61/716 [00:24<04:21,  2.51it/s, loss=13.8][A
[Epoch 9]:   9%|▊         | 62/716 [00:24<04:16,  2.55it/s, loss=13.8][A
[Epoch 9]:   9%|▊         | 62/716 [00:24<04:20,  2.51it/s, loss=13.5][A
[Epoch 9]:   9%|▉         | 63/716 [00

[Epoch 9]:  16%|█▌        | 111/716 [00:43<03:57,  2.55it/s, loss=13.7][A
[Epoch 9]:  16%|█▌        | 112/716 [00:43<03:54,  2.57it/s, loss=13.7][A
[Epoch 9]:  16%|█▌        | 112/716 [00:43<03:56,  2.55it/s, loss=13.3][A
[Epoch 9]:  16%|█▌        | 113/716 [00:43<03:54,  2.57it/s, loss=13.3][A
[Epoch 9]:  16%|█▌        | 113/716 [00:44<03:56,  2.55it/s, loss=14]  [A
[Epoch 9]:  16%|█▌        | 114/716 [00:44<03:54,  2.57it/s, loss=14][A
[Epoch 9]:  16%|█▌        | 114/716 [00:44<03:55,  2.55it/s, loss=13.5][A
[Epoch 9]:  16%|█▌        | 115/716 [00:44<03:53,  2.57it/s, loss=13.5][A
[Epoch 9]:  16%|█▌        | 115/716 [00:45<03:55,  2.55it/s, loss=13.5][A
[Epoch 9]:  16%|█▌        | 116/716 [00:45<03:53,  2.57it/s, loss=13.5][A
[Epoch 9]:  16%|█▌        | 116/716 [00:45<03:55,  2.55it/s, loss=12.4][A
[Epoch 9]:  16%|█▋        | 117/716 [00:45<03:52,  2.57it/s, loss=12.4][A
[Epoch 9]:  16%|█▋        | 117/716 [00:45<03:54,  2.55it/s, loss=13.7][A
[Epoch 9]:  16%|█▋        |

[Epoch 9]:  23%|██▎       | 166/716 [01:04<03:32,  2.58it/s, loss=13.4][A
[Epoch 9]:  23%|██▎       | 166/716 [01:04<03:34,  2.57it/s, loss=13.8][A
[Epoch 9]:  23%|██▎       | 167/716 [01:04<03:32,  2.58it/s, loss=13.8][A
[Epoch 9]:  23%|██▎       | 167/716 [01:05<03:33,  2.57it/s, loss=13.3][A
[Epoch 9]:  23%|██▎       | 168/716 [01:05<03:32,  2.58it/s, loss=13.3][A
[Epoch 9]:  23%|██▎       | 168/716 [01:05<03:33,  2.57it/s, loss=12.2][A
[Epoch 9]:  24%|██▎       | 169/716 [01:05<03:31,  2.58it/s, loss=12.2][A
[Epoch 9]:  24%|██▎       | 169/716 [01:05<03:32,  2.57it/s, loss=13.2][A
[Epoch 9]:  24%|██▎       | 170/716 [01:05<03:31,  2.58it/s, loss=13.2][A
[Epoch 9]:  24%|██▎       | 170/716 [01:06<03:32,  2.57it/s, loss=13.3][A
[Epoch 9]:  24%|██▍       | 171/716 [01:06<03:30,  2.58it/s, loss=13.3][A
[Epoch 9]:  24%|██▍       | 171/716 [01:06<03:32,  2.57it/s, loss=13.2][A
[Epoch 9]:  24%|██▍       | 172/716 [01:06<03:30,  2.58it/s, loss=13.2][A
[Epoch 9]:  24%|██▍      

[Epoch 9]:  31%|███       | 220/716 [01:25<03:12,  2.57it/s, loss=14.3][A
[Epoch 9]:  31%|███       | 221/716 [01:25<03:11,  2.59it/s, loss=14.3][A
[Epoch 9]:  31%|███       | 221/716 [01:25<03:12,  2.57it/s, loss=13.1][A
[Epoch 9]:  31%|███       | 222/716 [01:25<03:11,  2.59it/s, loss=13.1][A
[Epoch 9]:  31%|███       | 222/716 [01:26<03:11,  2.57it/s, loss=13.1][A
[Epoch 9]:  31%|███       | 223/716 [01:26<03:10,  2.59it/s, loss=13.1][A
[Epoch 9]:  31%|███       | 223/716 [01:26<03:11,  2.57it/s, loss=12.6][A
[Epoch 9]:  31%|███▏      | 224/716 [01:26<03:10,  2.59it/s, loss=12.6][A
[Epoch 9]:  31%|███▏      | 224/716 [01:27<03:11,  2.57it/s, loss=11.8][A
[Epoch 9]:  31%|███▏      | 225/716 [01:27<03:09,  2.59it/s, loss=11.8][A
[Epoch 9]:  31%|███▏      | 225/716 [01:27<03:10,  2.57it/s, loss=14.1][A
[Epoch 9]:  32%|███▏      | 226/716 [01:27<03:09,  2.59it/s, loss=14.1][A
[Epoch 9]:  32%|███▏      | 226/716 [01:27<03:10,  2.57it/s, loss=14.2][A
[Epoch 9]:  32%|███▏     

[Epoch 9]:  38%|███▊      | 275/716 [01:46<02:50,  2.59it/s, loss=12.5][A
[Epoch 9]:  38%|███▊      | 275/716 [01:46<02:50,  2.58it/s, loss=13.8][A
[Epoch 9]:  39%|███▊      | 276/716 [01:46<02:49,  2.59it/s, loss=13.8][A
[Epoch 9]:  39%|███▊      | 276/716 [01:46<02:50,  2.58it/s, loss=12.5][A
[Epoch 9]:  39%|███▊      | 277/716 [01:46<02:49,  2.59it/s, loss=12.5][A
[Epoch 9]:  39%|███▊      | 277/716 [01:47<02:50,  2.58it/s, loss=14]  [A
[Epoch 9]:  39%|███▉      | 278/716 [01:47<02:49,  2.59it/s, loss=14][A
[Epoch 9]:  39%|███▉      | 278/716 [01:47<02:49,  2.58it/s, loss=12.5][A
[Epoch 9]:  39%|███▉      | 279/716 [01:47<02:48,  2.59it/s, loss=12.5][A
[Epoch 9]:  39%|███▉      | 279/716 [01:48<02:49,  2.58it/s, loss=12.8][A
[Epoch 9]:  39%|███▉      | 280/716 [01:48<02:48,  2.59it/s, loss=12.8][A
[Epoch 9]:  39%|███▉      | 280/716 [01:48<02:48,  2.58it/s, loss=12.4][A
[Epoch 9]:  39%|███▉      | 281/716 [01:48<02:47,  2.59it/s, loss=12.4][A
[Epoch 9]:  39%|███▉      |

[Epoch 9]:  46%|████▌     | 329/716 [02:07<02:29,  2.58it/s, loss=12.6][A
[Epoch 9]:  46%|████▌     | 330/716 [02:07<02:28,  2.59it/s, loss=12.6][A
[Epoch 9]:  46%|████▌     | 330/716 [02:07<02:29,  2.58it/s, loss=13.8][A
[Epoch 9]:  46%|████▌     | 331/716 [02:07<02:28,  2.59it/s, loss=13.8][A
[Epoch 9]:  46%|████▌     | 331/716 [02:08<02:29,  2.58it/s, loss=12.9][A
[Epoch 9]:  46%|████▋     | 332/716 [02:08<02:28,  2.59it/s, loss=12.9][A
[Epoch 9]:  46%|████▋     | 332/716 [02:08<02:28,  2.58it/s, loss=13.3][A
[Epoch 9]:  47%|████▋     | 333/716 [02:08<02:27,  2.59it/s, loss=13.3][A
[Epoch 9]:  47%|████▋     | 333/716 [02:08<02:28,  2.58it/s, loss=13.2][A
[Epoch 9]:  47%|████▋     | 334/716 [02:08<02:27,  2.59it/s, loss=13.2][A
[Epoch 9]:  47%|████▋     | 334/716 [02:09<02:27,  2.58it/s, loss=14.4][A
[Epoch 9]:  47%|████▋     | 335/716 [02:09<02:27,  2.59it/s, loss=14.4][A
[Epoch 9]:  47%|████▋     | 335/716 [02:09<02:27,  2.58it/s, loss=12.5][A
[Epoch 9]:  47%|████▋    

[Epoch 9]:  54%|█████▎    | 384/716 [02:28<02:08,  2.59it/s, loss=12.4][A
[Epoch 9]:  54%|█████▎    | 384/716 [02:28<02:08,  2.58it/s, loss=14.3][A
[Epoch 9]:  54%|█████▍    | 385/716 [02:28<02:07,  2.59it/s, loss=14.3][A
[Epoch 9]:  54%|█████▍    | 385/716 [02:28<02:08,  2.58it/s, loss=13]  [A
[Epoch 9]:  54%|█████▍    | 386/716 [02:28<02:07,  2.59it/s, loss=13][A
[Epoch 9]:  54%|█████▍    | 386/716 [02:29<02:07,  2.58it/s, loss=13.3][A
[Epoch 9]:  54%|█████▍    | 387/716 [02:29<02:06,  2.59it/s, loss=13.3][A
[Epoch 9]:  54%|█████▍    | 387/716 [02:29<02:07,  2.59it/s, loss=13]  [A
[Epoch 9]:  54%|█████▍    | 388/716 [02:29<02:06,  2.59it/s, loss=13][A
[Epoch 9]:  54%|█████▍    | 388/716 [02:30<02:06,  2.59it/s, loss=14.2][A
[Epoch 9]:  54%|█████▍    | 389/716 [02:30<02:06,  2.59it/s, loss=14.2][A
[Epoch 9]:  54%|█████▍    | 389/716 [02:30<02:06,  2.59it/s, loss=14.3][A
[Epoch 9]:  54%|█████▍    | 390/716 [02:30<02:05,  2.59it/s, loss=14.3][A
[Epoch 9]:  54%|█████▍    | 3

[Epoch 9]:  61%|██████    | 438/716 [02:49<01:47,  2.59it/s, loss=13.9][A
[Epoch 9]:  61%|██████▏   | 439/716 [02:49<01:46,  2.59it/s, loss=13.9][A
[Epoch 9]:  61%|██████▏   | 439/716 [02:49<01:47,  2.59it/s, loss=12.7][A
[Epoch 9]:  61%|██████▏   | 440/716 [02:49<01:46,  2.59it/s, loss=12.7][A
[Epoch 9]:  61%|██████▏   | 440/716 [02:50<01:46,  2.59it/s, loss=13]  [A
[Epoch 9]:  62%|██████▏   | 441/716 [02:50<01:46,  2.59it/s, loss=13][A
[Epoch 9]:  62%|██████▏   | 441/716 [02:50<01:46,  2.59it/s, loss=13.5][A
[Epoch 9]:  62%|██████▏   | 442/716 [02:50<01:45,  2.59it/s, loss=13.5][A
[Epoch 9]:  62%|██████▏   | 442/716 [02:50<01:45,  2.59it/s, loss=13.5][A
[Epoch 9]:  62%|██████▏   | 443/716 [02:50<01:45,  2.59it/s, loss=13.5][A
[Epoch 9]:  62%|██████▏   | 443/716 [02:51<01:45,  2.59it/s, loss=13.2][A
[Epoch 9]:  62%|██████▏   | 444/716 [02:51<01:44,  2.59it/s, loss=13.2][A
[Epoch 9]:  62%|██████▏   | 444/716 [02:51<01:45,  2.59it/s, loss=14.2][A
[Epoch 9]:  62%|██████▏   |

[Epoch 9]:  69%|██████▉   | 493/716 [03:09<01:25,  2.60it/s, loss=13.3][A
[Epoch 9]:  69%|██████▉   | 493/716 [03:10<01:26,  2.59it/s, loss=13.2][A
[Epoch 9]:  69%|██████▉   | 494/716 [03:10<01:25,  2.60it/s, loss=13.2][A
[Epoch 9]:  69%|██████▉   | 494/716 [03:10<01:25,  2.59it/s, loss=13.9][A
[Epoch 9]:  69%|██████▉   | 495/716 [03:10<01:25,  2.60it/s, loss=13.9][A
[Epoch 9]:  69%|██████▉   | 495/716 [03:11<01:25,  2.59it/s, loss=14.1][A
[Epoch 9]:  69%|██████▉   | 496/716 [03:11<01:24,  2.60it/s, loss=14.1][A
[Epoch 9]:  69%|██████▉   | 496/716 [03:11<01:24,  2.59it/s, loss=12.7][A
[Epoch 9]:  69%|██████▉   | 497/716 [03:11<01:24,  2.60it/s, loss=12.7][A
[Epoch 9]:  69%|██████▉   | 497/716 [03:11<01:24,  2.59it/s, loss=13.3][A
[Epoch 9]:  70%|██████▉   | 498/716 [03:11<01:23,  2.60it/s, loss=13.3][A
[Epoch 9]:  70%|██████▉   | 498/716 [03:12<01:24,  2.59it/s, loss=12.4][A
[Epoch 9]:  70%|██████▉   | 499/716 [03:12<01:23,  2.60it/s, loss=12.4][A
[Epoch 9]:  70%|██████▉  

[Epoch 9]:  76%|███████▋  | 547/716 [03:30<01:05,  2.59it/s, loss=13.6][A
[Epoch 9]:  77%|███████▋  | 548/716 [03:30<01:04,  2.60it/s, loss=13.6][A
[Epoch 9]:  77%|███████▋  | 548/716 [03:31<01:04,  2.59it/s, loss=12.8][A
[Epoch 9]:  77%|███████▋  | 549/716 [03:31<01:04,  2.60it/s, loss=12.8][A
[Epoch 9]:  77%|███████▋  | 549/716 [03:31<01:04,  2.59it/s, loss=13.6][A
[Epoch 9]:  77%|███████▋  | 550/716 [03:31<01:03,  2.60it/s, loss=13.6][A
[Epoch 9]:  77%|███████▋  | 550/716 [03:32<01:04,  2.59it/s, loss=13.6][A
[Epoch 9]:  77%|███████▋  | 551/716 [03:32<01:03,  2.60it/s, loss=13.6][A
[Epoch 9]:  77%|███████▋  | 551/716 [03:32<01:03,  2.59it/s, loss=12.9][A
[Epoch 9]:  77%|███████▋  | 552/716 [03:32<01:03,  2.60it/s, loss=12.9][A
[Epoch 9]:  77%|███████▋  | 552/716 [03:32<01:03,  2.59it/s, loss=13.1][A
[Epoch 9]:  77%|███████▋  | 553/716 [03:32<01:02,  2.60it/s, loss=13.1][A
[Epoch 9]:  77%|███████▋  | 553/716 [03:33<01:02,  2.59it/s, loss=13.5][A
[Epoch 9]:  77%|███████▋ 

[Epoch 9]:  84%|████████▍ | 602/716 [03:51<00:43,  2.60it/s, loss=13.3][A
[Epoch 9]:  84%|████████▍ | 602/716 [03:51<00:43,  2.60it/s, loss=12.9][A
[Epoch 9]:  84%|████████▍ | 603/716 [03:51<00:43,  2.60it/s, loss=12.9][A
[Epoch 9]:  84%|████████▍ | 603/716 [03:52<00:43,  2.60it/s, loss=13.4][A
[Epoch 9]:  84%|████████▍ | 604/716 [03:52<00:43,  2.60it/s, loss=13.4][A
[Epoch 9]:  84%|████████▍ | 604/716 [03:52<00:43,  2.60it/s, loss=14]  [A
[Epoch 9]:  84%|████████▍ | 605/716 [03:52<00:42,  2.60it/s, loss=14][A
[Epoch 9]:  84%|████████▍ | 605/716 [03:52<00:42,  2.60it/s, loss=13.4][A
[Epoch 9]:  85%|████████▍ | 606/716 [03:52<00:42,  2.60it/s, loss=13.4][A
[Epoch 9]:  85%|████████▍ | 606/716 [03:53<00:42,  2.60it/s, loss=12.1][A
[Epoch 9]:  85%|████████▍ | 607/716 [03:53<00:41,  2.60it/s, loss=12.1][A
[Epoch 9]:  85%|████████▍ | 607/716 [03:53<00:41,  2.60it/s, loss=13.8][A
[Epoch 9]:  85%|████████▍ | 608/716 [03:53<00:41,  2.60it/s, loss=13.8][A
[Epoch 9]:  85%|████████▍ |

[Epoch 9]:  92%|█████████▏| 656/716 [04:12<00:23,  2.60it/s, loss=14.1][A
[Epoch 9]:  92%|█████████▏| 657/716 [04:12<00:22,  2.60it/s, loss=14.1][A
[Epoch 9]:  92%|█████████▏| 657/716 [04:12<00:22,  2.60it/s, loss=12.9][A
[Epoch 9]:  92%|█████████▏| 658/716 [04:12<00:22,  2.60it/s, loss=12.9][A
[Epoch 9]:  92%|█████████▏| 658/716 [04:13<00:22,  2.60it/s, loss=14]  [A
[Epoch 9]:  92%|█████████▏| 659/716 [04:13<00:21,  2.60it/s, loss=14][A
[Epoch 9]:  92%|█████████▏| 659/716 [04:13<00:21,  2.60it/s, loss=14.5][A
[Epoch 9]:  92%|█████████▏| 660/716 [04:13<00:21,  2.60it/s, loss=14.5][A
[Epoch 9]:  92%|█████████▏| 660/716 [04:14<00:21,  2.60it/s, loss=13.3][A
[Epoch 9]:  92%|█████████▏| 661/716 [04:14<00:21,  2.60it/s, loss=13.3][A
[Epoch 9]:  92%|█████████▏| 661/716 [04:14<00:21,  2.60it/s, loss=13.8][A
[Epoch 9]:  92%|█████████▏| 662/716 [04:14<00:20,  2.60it/s, loss=13.8][A
[Epoch 9]:  92%|█████████▏| 662/716 [04:14<00:20,  2.60it/s, loss=13.3][A
[Epoch 9]:  93%|█████████▎|

[Epoch 9]:  99%|█████████▉| 711/716 [04:33<00:01,  2.60it/s, loss=13.7][A
[Epoch 9]:  99%|█████████▉| 711/716 [04:33<00:01,  2.60it/s, loss=12.6][A
[Epoch 9]:  99%|█████████▉| 712/716 [04:33<00:01,  2.60it/s, loss=12.6][A
[Epoch 9]:  99%|█████████▉| 712/716 [04:34<00:01,  2.60it/s, loss=12.4][A
[Epoch 9]: 100%|█████████▉| 713/716 [04:34<00:01,  2.60it/s, loss=12.4][A
[Epoch 9]: 100%|█████████▉| 713/716 [04:34<00:01,  2.60it/s, loss=13.8][A
[Epoch 9]: 100%|█████████▉| 714/716 [04:34<00:00,  2.60it/s, loss=13.8][A
[Epoch 9]: 100%|█████████▉| 714/716 [04:34<00:00,  2.60it/s, loss=14.7][A
[Epoch 9]: 100%|█████████▉| 715/716 [04:34<00:00,  2.60it/s, loss=14.7][A
[Epoch 9]: 100%|█████████▉| 715/716 [04:34<00:00,  2.60it/s, loss=12.5][A
[Epoch 9]: 100%|██████████| 716/716 [04:34<00:00,  2.60it/s, loss=12.5][A
  0%|          | 0/716 [00:00<?, ?it/s][A
[Epoch 10]:   0%|          | 0/716 [00:00<?, ?it/s][A
[Epoch 10]:   0%|          | 0/716 [00:00<?, ?it/s, loss=14][A
[Epoch 10]:  

[Epoch 10]:   7%|▋         | 49/716 [00:19<04:26,  2.50it/s, loss=13.4][A
[Epoch 10]:   7%|▋         | 49/716 [00:19<04:31,  2.46it/s, loss=13.5][A
[Epoch 10]:   7%|▋         | 50/716 [00:19<04:25,  2.51it/s, loss=13.5][A
[Epoch 10]:   7%|▋         | 50/716 [00:20<04:30,  2.46it/s, loss=13.7][A
[Epoch 10]:   7%|▋         | 51/716 [00:20<04:24,  2.51it/s, loss=13.7][A
[Epoch 10]:   7%|▋         | 51/716 [00:20<04:29,  2.46it/s, loss=13.9][A
[Epoch 10]:   7%|▋         | 52/716 [00:20<04:24,  2.51it/s, loss=13.9][A
[Epoch 10]:   7%|▋         | 52/716 [00:21<04:29,  2.47it/s, loss=13.7][A
[Epoch 10]:   7%|▋         | 53/716 [00:21<04:23,  2.51it/s, loss=13.7][A
[Epoch 10]:   7%|▋         | 53/716 [00:21<04:28,  2.47it/s, loss=12.8][A
[Epoch 10]:   8%|▊         | 54/716 [00:21<04:23,  2.52it/s, loss=12.8][A
[Epoch 10]:   8%|▊         | 54/716 [00:21<04:27,  2.47it/s, loss=13.5][A
[Epoch 10]:   8%|▊         | 55/716 [00:21<04:22,  2.52it/s, loss=13.5][A
[Epoch 10]:   8%|▊       

[Epoch 10]:  14%|█▍        | 103/716 [00:40<04:01,  2.54it/s, loss=12.6][A
[Epoch 10]:  15%|█▍        | 104/716 [00:40<03:58,  2.57it/s, loss=12.6][A
[Epoch 10]:  15%|█▍        | 104/716 [00:40<04:00,  2.54it/s, loss=13.2][A
[Epoch 10]:  15%|█▍        | 105/716 [00:40<03:58,  2.57it/s, loss=13.2][A
[Epoch 10]:  15%|█▍        | 105/716 [00:41<04:00,  2.54it/s, loss=12.8][A
[Epoch 10]:  15%|█▍        | 106/716 [00:41<03:57,  2.57it/s, loss=12.8][A
[Epoch 10]:  15%|█▍        | 106/716 [00:41<03:59,  2.54it/s, loss=13.5][A
[Epoch 10]:  15%|█▍        | 107/716 [00:41<03:57,  2.57it/s, loss=13.5][A
[Epoch 10]:  15%|█▍        | 107/716 [00:42<03:59,  2.54it/s, loss=13.5][A
[Epoch 10]:  15%|█▌        | 108/716 [00:42<03:56,  2.57it/s, loss=13.5][A
[Epoch 10]:  15%|█▌        | 108/716 [00:42<03:58,  2.54it/s, loss=14.1][A
[Epoch 10]:  15%|█▌        | 109/716 [00:42<03:56,  2.57it/s, loss=14.1][A
[Epoch 10]:  15%|█▌        | 109/716 [00:42<03:58,  2.55it/s, loss=13.5][A
[Epoch 10]: 

[Epoch 10]:  22%|██▏       | 157/716 [01:01<03:37,  2.57it/s, loss=14.4][A
[Epoch 10]:  22%|██▏       | 158/716 [01:01<03:35,  2.59it/s, loss=14.4][A
[Epoch 10]:  22%|██▏       | 158/716 [01:01<03:36,  2.57it/s, loss=14.7][A
[Epoch 10]:  22%|██▏       | 159/716 [01:01<03:35,  2.59it/s, loss=14.7][A
[Epoch 10]:  22%|██▏       | 159/716 [01:01<03:36,  2.57it/s, loss=13]  [A
[Epoch 10]:  22%|██▏       | 160/716 [01:01<03:34,  2.59it/s, loss=13][A
[Epoch 10]:  22%|██▏       | 160/716 [01:02<03:36,  2.57it/s, loss=14.5][A
[Epoch 10]:  22%|██▏       | 161/716 [01:02<03:34,  2.59it/s, loss=14.5][A
[Epoch 10]:  22%|██▏       | 161/716 [01:02<03:35,  2.57it/s, loss=12.3][A
[Epoch 10]:  23%|██▎       | 162/716 [01:02<03:33,  2.59it/s, loss=12.3][A
[Epoch 10]:  23%|██▎       | 162/716 [01:02<03:35,  2.57it/s, loss=14.4][A
[Epoch 10]:  23%|██▎       | 163/716 [01:02<03:33,  2.59it/s, loss=14.4][A
[Epoch 10]:  23%|██▎       | 163/716 [01:03<03:34,  2.57it/s, loss=13.9][A
[Epoch 10]:  2

[Epoch 10]:  29%|██▉       | 211/716 [01:21<03:14,  2.60it/s, loss=13][A
[Epoch 10]:  29%|██▉       | 211/716 [01:21<03:15,  2.59it/s, loss=13.6][A
[Epoch 10]:  30%|██▉       | 212/716 [01:21<03:13,  2.60it/s, loss=13.6][A
[Epoch 10]:  30%|██▉       | 212/716 [01:21<03:14,  2.59it/s, loss=14.7][A
[Epoch 10]:  30%|██▉       | 213/716 [01:21<03:13,  2.60it/s, loss=14.7][A
[Epoch 10]:  30%|██▉       | 213/716 [01:22<03:14,  2.59it/s, loss=13]  [A
[Epoch 10]:  30%|██▉       | 214/716 [01:22<03:13,  2.60it/s, loss=13][A
[Epoch 10]:  30%|██▉       | 214/716 [01:22<03:14,  2.59it/s, loss=12.2][A
[Epoch 10]:  30%|███       | 215/716 [01:22<03:12,  2.60it/s, loss=12.2][A
[Epoch 10]:  30%|███       | 215/716 [01:23<03:13,  2.59it/s, loss=13.4][A
[Epoch 10]:  30%|███       | 216/716 [01:23<03:12,  2.60it/s, loss=13.4][A
[Epoch 10]:  30%|███       | 216/716 [01:23<03:13,  2.59it/s, loss=12.6][A
[Epoch 10]:  30%|███       | 217/716 [01:23<03:12,  2.60it/s, loss=12.6][A
[Epoch 10]:  30%

[Epoch 10]:  37%|███▋      | 265/716 [01:41<02:53,  2.60it/s, loss=13.4][A
[Epoch 10]:  37%|███▋      | 265/716 [01:42<02:53,  2.59it/s, loss=14.3][A
[Epoch 10]:  37%|███▋      | 266/716 [01:42<02:52,  2.60it/s, loss=14.3][A
[Epoch 10]:  37%|███▋      | 266/716 [01:42<02:53,  2.59it/s, loss=13.7][A
[Epoch 10]:  37%|███▋      | 267/716 [01:42<02:52,  2.60it/s, loss=13.7][A
[Epoch 10]:  37%|███▋      | 267/716 [01:42<02:53,  2.59it/s, loss=13.6][A
[Epoch 10]:  37%|███▋      | 268/716 [01:42<02:52,  2.60it/s, loss=13.6][A
[Epoch 10]:  37%|███▋      | 268/716 [01:43<02:52,  2.60it/s, loss=14]  [A
[Epoch 10]:  38%|███▊      | 269/716 [01:43<02:51,  2.60it/s, loss=14][A
[Epoch 10]:  38%|███▊      | 269/716 [01:43<02:52,  2.60it/s, loss=14][A
[Epoch 10]:  38%|███▊      | 270/716 [01:43<02:51,  2.60it/s, loss=14][A
[Epoch 10]:  38%|███▊      | 270/716 [01:44<02:51,  2.60it/s, loss=13.6][A
[Epoch 10]:  38%|███▊      | 271/716 [01:44<02:50,  2.61it/s, loss=13.6][A
[Epoch 10]:  38%|█

[Epoch 10]:  45%|████▍     | 319/716 [02:02<02:32,  2.61it/s, loss=13.8][A
[Epoch 10]:  45%|████▍     | 319/716 [02:02<02:32,  2.60it/s, loss=12.9][A
[Epoch 10]:  45%|████▍     | 320/716 [02:02<02:31,  2.61it/s, loss=12.9][A
[Epoch 10]:  45%|████▍     | 320/716 [02:03<02:32,  2.60it/s, loss=13.4][A
[Epoch 10]:  45%|████▍     | 321/716 [02:03<02:31,  2.61it/s, loss=13.4][A
[Epoch 10]:  45%|████▍     | 321/716 [02:03<02:31,  2.60it/s, loss=14.4][A
[Epoch 10]:  45%|████▍     | 322/716 [02:03<02:30,  2.61it/s, loss=14.4][A
[Epoch 10]:  45%|████▍     | 322/716 [02:03<02:31,  2.60it/s, loss=12.9][A
[Epoch 10]:  45%|████▌     | 323/716 [02:03<02:30,  2.61it/s, loss=12.9][A
[Epoch 10]:  45%|████▌     | 323/716 [02:04<02:31,  2.60it/s, loss=13.4][A
[Epoch 10]:  45%|████▌     | 324/716 [02:04<02:30,  2.61it/s, loss=13.4][A
[Epoch 10]:  45%|████▌     | 324/716 [02:04<02:30,  2.60it/s, loss=13.2][A
[Epoch 10]:  45%|████▌     | 325/716 [02:04<02:29,  2.61it/s, loss=13.2][A
[Epoch 10]: 

[Epoch 10]:  52%|█████▏    | 372/716 [02:22<02:12,  2.60it/s, loss=13.7][A
[Epoch 10]:  52%|█████▏    | 373/716 [02:22<02:11,  2.61it/s, loss=13.7][A
[Epoch 10]:  52%|█████▏    | 373/716 [02:23<02:11,  2.60it/s, loss=13.4][A
[Epoch 10]:  52%|█████▏    | 374/716 [02:23<02:11,  2.61it/s, loss=13.4][A
[Epoch 10]:  52%|█████▏    | 374/716 [02:23<02:11,  2.60it/s, loss=13.6][A
[Epoch 10]:  52%|█████▏    | 375/716 [02:23<02:10,  2.61it/s, loss=13.6][A
[Epoch 10]:  52%|█████▏    | 375/716 [02:24<02:10,  2.60it/s, loss=14.5][A
[Epoch 10]:  53%|█████▎    | 376/716 [02:24<02:10,  2.61it/s, loss=14.5][A
[Epoch 10]:  53%|█████▎    | 376/716 [02:24<02:10,  2.60it/s, loss=13.3][A
[Epoch 10]:  53%|█████▎    | 377/716 [02:24<02:09,  2.61it/s, loss=13.3][A
[Epoch 10]:  53%|█████▎    | 377/716 [02:24<02:10,  2.60it/s, loss=13.2][A
[Epoch 10]:  53%|█████▎    | 378/716 [02:24<02:09,  2.61it/s, loss=13.2][A
[Epoch 10]:  53%|█████▎    | 378/716 [02:25<02:09,  2.60it/s, loss=14.8][A
[Epoch 10]: 

[Epoch 10]:  59%|█████▉    | 426/716 [02:43<01:51,  2.61it/s, loss=13.6][A
[Epoch 10]:  59%|█████▉    | 426/716 [02:43<01:51,  2.60it/s, loss=13.5][A
[Epoch 10]:  60%|█████▉    | 427/716 [02:43<01:50,  2.61it/s, loss=13.5][A
[Epoch 10]:  60%|█████▉    | 427/716 [02:43<01:50,  2.60it/s, loss=13.5][A
[Epoch 10]:  60%|█████▉    | 428/716 [02:43<01:50,  2.61it/s, loss=13.5][A
[Epoch 10]:  60%|█████▉    | 428/716 [02:44<01:50,  2.60it/s, loss=13.6][A
[Epoch 10]:  60%|█████▉    | 429/716 [02:44<01:49,  2.61it/s, loss=13.6][A
[Epoch 10]:  60%|█████▉    | 429/716 [02:44<01:50,  2.60it/s, loss=13.1][A
[Epoch 10]:  60%|██████    | 430/716 [02:44<01:49,  2.61it/s, loss=13.1][A
[Epoch 10]:  60%|██████    | 430/716 [02:45<01:49,  2.60it/s, loss=12.5][A
[Epoch 10]:  60%|██████    | 431/716 [02:45<01:49,  2.61it/s, loss=12.5][A
[Epoch 10]:  60%|██████    | 431/716 [02:45<01:49,  2.60it/s, loss=13.5][A
[Epoch 10]:  60%|██████    | 432/716 [02:45<01:48,  2.61it/s, loss=13.5][A
[Epoch 10]: 

[Epoch 10]:  67%|██████▋   | 480/716 [03:03<01:30,  2.61it/s, loss=12.7][A
[Epoch 10]:  67%|██████▋   | 480/716 [03:04<01:30,  2.61it/s, loss=13.1][A
[Epoch 10]:  67%|██████▋   | 481/716 [03:04<01:29,  2.61it/s, loss=13.1][A
[Epoch 10]:  67%|██████▋   | 481/716 [03:04<01:30,  2.61it/s, loss=13.5][A
[Epoch 10]:  67%|██████▋   | 482/716 [03:04<01:29,  2.61it/s, loss=13.5][A
[Epoch 10]:  67%|██████▋   | 482/716 [03:04<01:29,  2.61it/s, loss=12.8][A
[Epoch 10]:  67%|██████▋   | 483/716 [03:04<01:29,  2.61it/s, loss=12.8][A
[Epoch 10]:  67%|██████▋   | 483/716 [03:05<01:29,  2.61it/s, loss=12.9][A
[Epoch 10]:  68%|██████▊   | 484/716 [03:05<01:28,  2.61it/s, loss=12.9][A
[Epoch 10]:  68%|██████▊   | 484/716 [03:05<01:28,  2.61it/s, loss=13]  [A
[Epoch 10]:  68%|██████▊   | 485/716 [03:05<01:28,  2.61it/s, loss=13][A
[Epoch 10]:  68%|██████▊   | 485/716 [03:06<01:28,  2.61it/s, loss=12.3][A
[Epoch 10]:  68%|██████▊   | 486/716 [03:06<01:28,  2.61it/s, loss=12.3][A
[Epoch 10]:  6

[Epoch 10]:  74%|███████▍  | 533/716 [03:24<01:10,  2.61it/s, loss=13.2][A
[Epoch 10]:  75%|███████▍  | 534/716 [03:24<01:09,  2.61it/s, loss=13.2][A
[Epoch 10]:  75%|███████▍  | 534/716 [03:24<01:09,  2.61it/s, loss=13.6][A
[Epoch 10]:  75%|███████▍  | 535/716 [03:24<01:09,  2.61it/s, loss=13.6][A
[Epoch 10]:  75%|███████▍  | 535/716 [03:25<01:09,  2.61it/s, loss=14.5][A
[Epoch 10]:  75%|███████▍  | 536/716 [03:25<01:08,  2.61it/s, loss=14.5][A
[Epoch 10]:  75%|███████▍  | 536/716 [03:25<01:08,  2.61it/s, loss=13.4][A
[Epoch 10]:  75%|███████▌  | 537/716 [03:25<01:08,  2.61it/s, loss=13.4][A
[Epoch 10]:  75%|███████▌  | 537/716 [03:25<01:08,  2.61it/s, loss=13.1][A
[Epoch 10]:  75%|███████▌  | 538/716 [03:25<01:08,  2.61it/s, loss=13.1][A
[Epoch 10]:  75%|███████▌  | 538/716 [03:26<01:08,  2.61it/s, loss=13.3][A
[Epoch 10]:  75%|███████▌  | 539/716 [03:26<01:07,  2.61it/s, loss=13.3][A
[Epoch 10]:  75%|███████▌  | 539/716 [03:26<01:07,  2.61it/s, loss=12.4][A
[Epoch 10]: 

[Epoch 10]:  82%|████████▏ | 587/716 [03:44<00:49,  2.61it/s, loss=12.7][A
[Epoch 10]:  82%|████████▏ | 587/716 [03:44<00:49,  2.61it/s, loss=12.9][A
[Epoch 10]:  82%|████████▏ | 588/716 [03:44<00:48,  2.61it/s, loss=12.9][A
[Epoch 10]:  82%|████████▏ | 588/716 [03:45<00:49,  2.61it/s, loss=12.5][A
[Epoch 10]:  82%|████████▏ | 589/716 [03:45<00:48,  2.61it/s, loss=12.5][A
[Epoch 10]:  82%|████████▏ | 589/716 [03:45<00:48,  2.61it/s, loss=14.2][A
[Epoch 10]:  82%|████████▏ | 590/716 [03:45<00:48,  2.61it/s, loss=14.2][A
[Epoch 10]:  82%|████████▏ | 590/716 [03:46<00:48,  2.61it/s, loss=13.1][A
[Epoch 10]:  83%|████████▎ | 591/716 [03:46<00:47,  2.61it/s, loss=13.1][A
[Epoch 10]:  83%|████████▎ | 591/716 [03:46<00:47,  2.61it/s, loss=14.6][A
[Epoch 10]:  83%|████████▎ | 592/716 [03:46<00:47,  2.61it/s, loss=14.6][A
[Epoch 10]:  83%|████████▎ | 592/716 [03:46<00:47,  2.61it/s, loss=12.9][A
[Epoch 10]:  83%|████████▎ | 593/716 [03:46<00:47,  2.61it/s, loss=12.9][A
[Epoch 10]: 

[Epoch 10]:  89%|████████▉ | 640/716 [04:05<00:29,  2.61it/s, loss=13]  [A
[Epoch 10]:  90%|████████▉ | 641/716 [04:05<00:28,  2.61it/s, loss=13][A
[Epoch 10]:  90%|████████▉ | 641/716 [04:05<00:28,  2.61it/s, loss=14][A
[Epoch 10]:  90%|████████▉ | 642/716 [04:05<00:28,  2.61it/s, loss=14][A
[Epoch 10]:  90%|████████▉ | 642/716 [04:06<00:28,  2.61it/s, loss=14][A
[Epoch 10]:  90%|████████▉ | 643/716 [04:06<00:27,  2.61it/s, loss=14][A
[Epoch 10]:  90%|████████▉ | 643/716 [04:06<00:27,  2.61it/s, loss=12.5][A
[Epoch 10]:  90%|████████▉ | 644/716 [04:06<00:27,  2.61it/s, loss=12.5][A
[Epoch 10]:  90%|████████▉ | 644/716 [04:06<00:27,  2.61it/s, loss=13.6][A
[Epoch 10]:  90%|█████████ | 645/716 [04:06<00:27,  2.61it/s, loss=13.6][A
[Epoch 10]:  90%|█████████ | 645/716 [04:07<00:27,  2.61it/s, loss=13.7][A
[Epoch 10]:  90%|█████████ | 646/716 [04:07<00:26,  2.61it/s, loss=13.7][A
[Epoch 10]:  90%|█████████ | 646/716 [04:07<00:26,  2.61it/s, loss=13.1][A
[Epoch 10]:  90%|█████

[Epoch 10]:  97%|█████████▋| 694/716 [04:25<00:08,  2.61it/s, loss=13.6][A
[Epoch 10]:  97%|█████████▋| 694/716 [04:25<00:08,  2.61it/s, loss=15.1][A
[Epoch 10]:  97%|█████████▋| 695/716 [04:25<00:08,  2.61it/s, loss=15.1][A
[Epoch 10]:  97%|█████████▋| 695/716 [04:26<00:08,  2.61it/s, loss=12.7][A
[Epoch 10]:  97%|█████████▋| 696/716 [04:26<00:07,  2.61it/s, loss=12.7][A
[Epoch 10]:  97%|█████████▋| 696/716 [04:26<00:07,  2.61it/s, loss=12.8][A
[Epoch 10]:  97%|█████████▋| 697/716 [04:26<00:07,  2.61it/s, loss=12.8][A
[Epoch 10]:  97%|█████████▋| 697/716 [04:27<00:07,  2.61it/s, loss=13.5][A
[Epoch 10]:  97%|█████████▋| 698/716 [04:27<00:06,  2.61it/s, loss=13.5][A
[Epoch 10]:  97%|█████████▋| 698/716 [04:27<00:06,  2.61it/s, loss=13.3][A
[Epoch 10]:  98%|█████████▊| 699/716 [04:27<00:06,  2.61it/s, loss=13.3][A
[Epoch 10]:  98%|█████████▊| 699/716 [04:27<00:06,  2.61it/s, loss=13.5][A
[Epoch 10]:  98%|█████████▊| 700/716 [04:27<00:06,  2.61it/s, loss=13.5][A
[Epoch 10]: 

In [34]:
model_1.ivectors.weight.data.cpu().numpy()[3]

array([ 0.05816619,  0.04498733,  0.09160124, -0.17151251,  0.10322422,
        0.03000014,  0.01200111, -0.13853897, -0.00585345,  0.03884761,
        0.0371792 , -0.09004281, -0.07565466,  0.02033259, -0.02968116,
       -0.07956991,  0.00401943, -0.01603008, -0.08317608, -0.13277908,
        0.10089583, -0.08572169,  0.0722882 ,  0.0231715 ,  0.05441654,
       -0.06812048, -0.05478003,  0.09775572, -0.01404165,  0.00129854,
       -0.00281095, -0.04445899, -0.13130639, -0.00629688, -0.02344881,
        0.02692058, -0.09760157,  0.04150186, -0.03530991,  0.00656995,
        0.02200015,  0.01385296, -0.11589619, -0.01922443, -0.05797816,
       -0.03792982, -0.0039581 ,  0.01625879,  0.05939846,  0.03436416,
        0.05823668, -0.03517651, -0.00515196, -0.09179679,  0.06125971,
        0.03553877, -0.13070497,  0.01148216,  0.13685359, -0.11627848,
        0.05867105,  0.02773466,  0.03072521, -0.00707116,  0.19710493,
        0.04737592, -0.09089682,  0.02742238,  0.08533072, -0.04

In [35]:
vector3

array([ 0.05789586,  0.04476868,  0.09167903, -0.17152733,  0.10329971,
        0.03014417,  0.01219846, -0.13819744, -0.00565925,  0.03899888,
        0.03732952, -0.0898168 , -0.07575436,  0.02051679, -0.02981773,
       -0.07936405,  0.00382746, -0.01618091, -0.08324953, -0.1328506 ,
        0.10098054, -0.08548413,  0.07240234,  0.02332029,  0.05415119,
       -0.06823785, -0.05450507,  0.09783662, -0.01419741,  0.00150108,
       -0.00262661, -0.04425149, -0.13105522, -0.00611185, -0.02356478,
        0.02706797, -0.09736105,  0.04132115, -0.03511995,  0.00675131,
        0.02178738,  0.01402447, -0.11562996, -0.01941235, -0.0577183 ,
       -0.03773048, -0.00415369,  0.01645307,  0.05912367,  0.03455342,
        0.0583756 , -0.0349873 , -0.00496768, -0.09155397,  0.06138192,
        0.03567986, -0.13077518,  0.01166302,  0.13653545, -0.11633229,
        0.05879457,  0.02754627,  0.03053075, -0.00725776,  0.19709015,
        0.04714454, -0.09065689,  0.02722152,  0.0851267 , -0.04

In [184]:
sum([0 == tens for tens in LT([0,1,1,2,5,6,3]).numpy()])

1

In [191]:
LT(vector3).shape

torch.Size([300])

In [210]:
print(LT(np.array([[2,5,8],[4,5,77]])).shape, LT([1,2,3]).shape)

torch.Size([2, 3]) torch.Size([3])


In [259]:
sgns_1(LT([1,2,3]), LT(np.array([[2,5,8],[4,5,77]]).T), None)

ivectors torch.Size([3, 300, 1])
ovectors torch.Size([3, 2, 300])
nvectors torch.Size([3, 200, 300])
torch.Size([3])
torch.Size([3])
torch.Size([])


tensor(70.0079, device='cuda:0', grad_fn=<NegBackward>)

In [196]:
n_epoch = 10
mb = 1000

for epoch in range(1, n_epoch + 1):
    dataset = PermutedSubsampledCorpus(os.path.join(data_path, 'train.dat'), ws)
    dataloader = DataLoader(dataset, batch_size=mb, shuffle=True)
    total_batches = int(np.ceil(len(dataset) / mb))
    pbar = tqdm(dataloader)
    pbar.set_description("[Epoch {}]".format(epoch))
    for iword, owords in pbar:
        print(iword.shape)
        print(owords.shape)
        print('----')


  0%|          | 0/715 [00:00<?, ?it/s][A
[Epoch 1]:   2%|▏         | 14/715 [00:00<00:23, 30.14it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 1]:   6%|▋         | 46/715 [00:00<00:09, 68.31it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 1]:  11%|█         | 79/715 [00:00<00:07, 89.40it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 1]:  16%|█▌        | 111/715 [00:01<00:05, 101.93it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 1]:  20%|██        | 143/715 [00:01<00:05, 110.13it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 1]:  24%|██▍       | 175/715 [00:01<00:04, 116.34it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 1]:  29%|██▉       | 207/715 [00:01<00:04, 120.93it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 1]:  33%|███▎      | 239/715 [00:01<00:03, 124.22it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 1]:  38%|███▊      | 271/715 [00:02<00:03, 126.89it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 1]:  43%|████▎     | 304/715 [00:02<00:03, 129.77it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 1]:  47%|████▋     | 337/715 [00:02<00:02, 132.20it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 1]:  52%|█████▏    | 369/715 [00:02<00:02, 134.02it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 1]:  56%|█████▌    | 402/715 [00:02<00:02, 135.94it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 1]:  61%|██████    | 435/715 [00:03<00:02, 137.37it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 1]:  65%|██████▌   | 467/715 [00:03<00:01, 138.39it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 1]:  70%|██████▉   | 499/715 [00:03<00:01, 138.84it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 1]:  74%|███████▍  | 531/715 [00:03<00:01, 139.77it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 1]:  79%|███████▉  | 564/715 [00:04<00:01, 140.76it/s]


torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([

[Epoch 1]:  84%|████████▎ | 598/715 [00:04<00:00, 141.94it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 1]:  88%|████████▊ | 632/715 [00:04<00:00, 142.83it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 1]:  93%|█████████▎| 665/715 [00:04<00:00, 142.17it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 1]:  97%|█████████▋| 696/715 [00:04<00:00, 142.48it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 1]: 100%|██████████| 715/715 [00:05<00:00, 142.46it/s]


torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([753])
torch.Size([753, 10])
----


[Epoch 2]:   2%|▏         | 15/716 [00:00<00:21, 33.33it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 2]:   6%|▋         | 46/716 [00:00<00:09, 70.39it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 2]:  11%|█         | 78/716 [00:00<00:07, 90.64it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 2]:  16%|█▌        | 112/716 [00:01<00:05, 104.59it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 2]:  20%|██        | 146/716 [00:01<00:05, 113.93it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 2]:  25%|██▌       | 180/716 [00:01<00:04, 120.76it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 2]:  30%|██▉       | 214/716 [00:01<00:03, 126.12it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 2]:  35%|███▍      | 248/716 [00:01<00:03, 129.84it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 2]:  39%|███▉      | 282/716 [00:02<00:03, 132.83it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 2]:  44%|████▍     | 316/716 [00:02<00:02, 135.38it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 2]:  49%|████▉     | 350/716 [00:02<00:02, 137.31it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 2]:  53%|█████▎    | 383/716 [00:02<00:02, 138.87it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 2]:  58%|█████▊    | 415/716 [00:02<00:02, 139.80it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 2]:  63%|██████▎   | 449/716 [00:03<00:01, 141.39it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 2]:  67%|██████▋   | 483/716 [00:03<00:01, 142.28it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 2]:  72%|███████▏  | 517/716 [00:03<00:01, 143.60it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 2]:  77%|███████▋  | 550/716 [00:03<00:01, 144.14it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 2]:  81%|████████▏ | 582/716 [00:04<00:00, 144.90it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 2]:  86%|████████▌ | 614/716 [00:04<00:00, 145.46it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 2]:  90%|█████████ | 646/716 [00:04<00:00, 146.07it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 2]:  95%|█████████▍| 679/716 [00:04<00:00, 146.59it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 2]: 100%|██████████| 716/716 [00:04<00:00, 146.99it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1


[Epoch 3]:   2%|▏         | 14/716 [00:00<00:23, 30.35it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 3]:   7%|▋         | 47/716 [00:00<00:09, 70.25it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 3]:  11%|█         | 80/716 [00:00<00:06, 91.57it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 3]:  16%|█▌        | 113/716 [00:01<00:05, 104.97it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 3]:  20%|██        | 146/716 [00:01<00:05, 113.77it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 3]:  25%|██▍       | 178/716 [00:01<00:04, 119.62it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 3]:  29%|██▉       | 210/716 [00:01<00:04, 123.71it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 3]:  34%|███▍      | 242/716 [00:01<00:03, 127.07it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 3]:  38%|███▊      | 274/716 [00:02<00:03, 129.16it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 3]:  43%|████▎     | 306/716 [00:02<00:03, 131.40it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 3]:  47%|████▋     | 339/716 [00:02<00:02, 133.71it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 3]:  52%|█████▏    | 372/716 [00:02<00:02, 135.55it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 3]:  56%|█████▋    | 404/716 [00:02<00:02, 136.81it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 3]:  61%|██████    | 437/716 [00:03<00:02, 138.30it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 3]:  66%|██████▌   | 469/716 [00:03<00:01, 139.08it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 3]:  70%|███████   | 503/716 [00:03<00:01, 140.42it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 3]:  75%|███████▌  | 537/716 [00:03<00:01, 141.68it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 3]:  80%|███████▉  | 571/716 [00:04<00:01, 142.69it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 3]:  84%|████████▍ | 605/716 [00:04<00:00, 143.27it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 3]:  89%|████████▉ | 637/716 [00:04<00:00, 143.87it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 3]:  93%|█████████▎| 669/716 [00:04<00:00, 144.35it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 3]:  98%|█████████▊| 701/716 [00:04<00:00, 144.75it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 3]: 100%|██████████| 716/716 [00:04<00:00, 144.78it/s]


torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([336])
torch.Size([336, 10])
----


[Epoch 4]:   2%|▏         | 15/716 [00:00<00:21, 32.83it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 4]:   6%|▋         | 46/716 [00:00<00:09, 69.20it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 4]:  11%|█         | 80/716 [00:00<00:06, 91.34it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 4]:  16%|█▌        | 113/716 [00:01<00:05, 104.43it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 4]:  20%|██        | 146/716 [00:01<00:05, 113.39it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 4]:  25%|██▍       | 178/716 [00:01<00:04, 119.18it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 4]:  29%|██▉       | 211/716 [00:01<00:04, 124.07it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 4]:  34%|███▍      | 243/716 [00:01<00:03, 127.26it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 4]:  38%|███▊      | 275/716 [00:02<00:03, 129.94it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 4]:  43%|████▎     | 307/716 [00:02<00:03, 131.97it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 4]:  47%|████▋     | 340/716 [00:02<00:02, 134.15it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 4]:  52%|█████▏    | 372/716 [00:02<00:02, 135.89it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 4]:  56%|█████▋    | 404/716 [00:02<00:02, 137.26it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 4]:  61%|██████    | 436/716 [00:03<00:02, 138.40it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 4]:  65%|██████▌   | 468/716 [00:03<00:01, 139.38it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 4]:  70%|██████▉   | 500/716 [00:03<00:01, 140.29it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 4]:  74%|███████▍  | 533/716 [00:03<00:01, 141.21it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 4]:  79%|███████▉  | 566/716 [00:03<00:01, 141.93it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 4]:  84%|████████▎ | 599/716 [00:04<00:00, 142.66it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 4]:  88%|████████▊ | 632/716 [00:04<00:00, 143.41it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 4]:  93%|█████████▎| 664/716 [00:04<00:00, 143.95it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 4]:  97%|█████████▋| 697/716 [00:04<00:00, 144.52it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 4]: 100%|██████████| 716/716 [00:04<00:00, 144.73it/s]


torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([451])
torch.Size([451, 10])
----


[Epoch 5]:   2%|▏         | 16/717 [00:00<00:19, 35.69it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 5]:   7%|▋         | 49/717 [00:00<00:08, 74.89it/s]


torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([

[Epoch 5]:  12%|█▏        | 83/717 [00:00<00:06, 96.02it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 5]:  16%|█▌        | 115/717 [00:01<00:05, 107.24it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 5]:  21%|██        | 147/717 [00:01<00:04, 114.54it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 5]:  25%|██▍       | 179/717 [00:01<00:04, 120.15it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 5]:  30%|██▉       | 213/717 [00:01<00:04, 125.43it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 5]:  34%|███▍      | 246/717 [00:01<00:03, 128.81it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 5]:  39%|███▉      | 278/717 [00:02<00:03, 131.10it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 5]:  43%|████▎     | 310/717 [00:02<00:03, 133.42it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 5]:  48%|████▊     | 342/717 [00:02<00:02, 135.23it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 5]:  52%|█████▏    | 374/717 [00:02<00:02, 136.14it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 5]:  57%|█████▋    | 406/717 [00:02<00:02, 137.18it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 5]:  61%|██████    | 438/717 [00:03<00:02, 137.89it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 5]:  66%|██████▌   | 470/717 [00:03<00:01, 138.78it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 5]:  70%|██████▉   | 501/717 [00:03<00:01, 137.45it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 5]:  74%|███████▍  | 534/717 [00:03<00:01, 138.56it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 5]:  79%|███████▉  | 566/717 [00:04<00:01, 139.45it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 5]:  84%|████████▎ | 599/717 [00:04<00:00, 140.30it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 5]:  88%|████████▊ | 631/717 [00:04<00:00, 141.14it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 5]:  92%|█████████▏| 663/717 [00:04<00:00, 141.54it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 5]:  97%|█████████▋| 696/717 [00:04<00:00, 142.29it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 5]: 100%|██████████| 717/717 [00:05<00:00, 142.46it/s]


torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([62])
torch.Size([62, 10])
----


[Epoch 6]:   2%|▏         | 17/717 [00:00<00:18, 37.75it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 6]:   7%|▋         | 49/717 [00:00<00:08, 74.75it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 6]:  11%|█▏        | 81/717 [00:00<00:06, 94.31it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 6]:  16%|█▌        | 115/717 [00:01<00:05, 107.35it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 6]:  20%|██        | 146/717 [00:01<00:04, 114.25it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 6]:  25%|██▍       | 178/717 [00:01<00:04, 120.21it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 6]:  29%|██▉       | 210/717 [00:01<00:04, 124.18it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 6]:  34%|███▍      | 243/717 [00:01<00:03, 128.17it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 6]:  38%|███▊      | 276/717 [00:02<00:03, 131.35it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 6]:  43%|████▎     | 308/717 [00:02<00:03, 133.26it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 6]:  48%|████▊     | 341/717 [00:02<00:02, 135.50it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 6]:  52%|█████▏    | 373/717 [00:02<00:02, 136.52it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 6]:  57%|█████▋    | 406/717 [00:02<00:02, 138.36it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 6]:  61%|██████▏   | 440/717 [00:03<00:01, 139.64it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 6]:  66%|██████▌   | 472/717 [00:03<00:01, 140.21it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 6]:  70%|███████   | 505/717 [00:03<00:01, 141.48it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 6]:  75%|███████▌  | 538/717 [00:03<00:01, 142.48it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 6]:  80%|███████▉  | 571/717 [00:03<00:01, 143.28it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 6]:  84%|████████▍ | 604/717 [00:04<00:00, 144.12it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 6]:  89%|████████▉ | 637/717 [00:04<00:00, 144.84it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 6]:  93%|█████████▎| 670/717 [00:04<00:00, 145.60it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 6]: 100%|██████████| 717/717 [00:04<00:00, 146.26it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1


[Epoch 7]:   2%|▏         | 15/717 [00:00<00:20, 33.46it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 7]:   7%|▋         | 47/717 [00:00<00:09, 71.96it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 7]:  11%|█         | 78/717 [00:00<00:07, 90.79it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 7]:  15%|█▌        | 111/717 [00:01<00:05, 104.03it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 7]:  20%|█▉        | 143/717 [00:01<00:05, 112.37it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 7]:  25%|██▍       | 176/717 [00:01<00:04, 119.30it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 7]:  29%|██▉       | 209/717 [00:01<00:04, 124.04it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 7]:  34%|███▎      | 241/717 [00:01<00:03, 127.77it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 7]:  38%|███▊      | 273/717 [00:02<00:03, 129.74it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 7]:  43%|████▎     | 305/717 [00:02<00:03, 132.08it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 7]:  47%|████▋     | 337/717 [00:02<00:02, 134.01it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 7]:  52%|█████▏    | 370/717 [00:02<00:02, 135.84it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 7]:  56%|█████▋    | 404/717 [00:02<00:02, 137.70it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 7]:  61%|██████    | 437/717 [00:03<00:02, 139.12it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 7]:  65%|██████▌   | 469/717 [00:03<00:01, 139.80it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 7]:  70%|██████▉   | 501/717 [00:03<00:01, 140.65it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 7]:  74%|███████▍  | 534/717 [00:03<00:01, 141.72it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 7]:  79%|███████▉  | 567/717 [00:03<00:01, 142.72it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 7]:  84%|████████▎ | 599/717 [00:04<00:00, 143.27it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 7]:  88%|████████▊ | 633/717 [00:04<00:00, 144.23it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 7]:  93%|█████████▎| 665/717 [00:04<00:00, 144.72it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 7]:  97%|█████████▋| 697/717 [00:04<00:00, 145.01it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 7]: 100%|██████████| 717/717 [00:04<00:00, 145.09it/s]


torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([671])
torch.Size([671, 10])
----


[Epoch 8]:   2%|▏         | 14/715 [00:00<00:23, 30.40it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 8]:   6%|▋         | 45/715 [00:00<00:09, 67.18it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 8]:  11%|█         | 77/715 [00:00<00:07, 88.22it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 8]:  15%|█▌        | 108/715 [00:01<00:06, 99.79it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 8]:  20%|█▉        | 140/715 [00:01<00:05, 108.74it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 8]:  24%|██▍       | 172/715 [00:01<00:04, 115.47it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 8]:  29%|██▊       | 205/715 [00:01<00:04, 120.70it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 8]:  33%|███▎      | 238/715 [00:01<00:03, 124.68it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 8]:  38%|███▊      | 270/715 [00:02<00:03, 127.44it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 8]:  43%|████▎     | 304/715 [00:02<00:03, 130.87it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 8]:  47%|████▋     | 338/715 [00:02<00:02, 133.57it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 8]:  52%|█████▏    | 372/715 [00:02<00:02, 135.57it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 8]:  57%|█████▋    | 406/715 [00:02<00:02, 137.10it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 8]:  61%|██████▏   | 438/715 [00:03<00:02, 138.10it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 8]:  66%|██████▌   | 470/715 [00:03<00:01, 139.08it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 8]:  70%|███████   | 504/715 [00:03<00:01, 140.46it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 8]:  75%|███████▌  | 538/715 [00:03<00:01, 141.61it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 8]:  80%|████████  | 572/715 [00:04<00:01, 142.89it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 8]:  85%|████████▍ | 606/715 [00:04<00:00, 143.61it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 8]:  89%|████████▉ | 638/715 [00:04<00:00, 144.19it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 8]:  94%|█████████▍| 671/715 [00:04<00:00, 144.85it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 8]:  98%|█████████▊| 703/715 [00:04<00:00, 145.15it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 8]: 100%|██████████| 715/715 [00:04<00:00, 145.14it/s]


torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([548])
torch.Size([548, 10])
----


[Epoch 9]:   2%|▏         | 14/717 [00:00<00:22, 31.16it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 9]:   6%|▌         | 44/717 [00:00<00:09, 67.58it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 9]:  10%|█         | 75/717 [00:00<00:07, 87.98it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 9]:  17%|█▋        | 123/717 [00:01<00:05, 106.33it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 9]:  21%|██▏       | 154/717 [00:01<00:04, 112.94it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 9]:  26%|██▌       | 186/717 [00:01<00:04, 118.40it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 9]:  31%|███       | 219/717 [00:01<00:04, 123.01it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 9]:  35%|███▌      | 252/717 [00:01<00:03, 126.72it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 9]:  40%|███▉      | 286/717 [00:02<00:03, 129.98it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 9]:  44%|████▍     | 318/717 [00:02<00:03, 132.13it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 9]:  49%|████▉     | 350/717 [00:02<00:02, 133.62it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 9]:  53%|█████▎    | 382/717 [00:02<00:02, 135.25it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 9]:  58%|█████▊    | 414/717 [00:03<00:02, 136.68it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 9]:  62%|██████▏   | 446/717 [00:03<00:01, 137.72it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 9]:  67%|██████▋   | 478/717 [00:03<00:01, 138.88it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 9]:  71%|███████   | 510/717 [00:03<00:01, 139.33it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 9]:  76%|███████▌  | 545/717 [00:03<00:01, 140.93it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 9]:  81%|████████  | 579/717 [00:04<00:00, 142.03it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 9]:  85%|████████▌ | 613/717 [00:04<00:00, 142.90it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 9]:  90%|█████████ | 647/717 [00:04<00:00, 143.68it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 9]:  95%|█████████▍| 681/717 [00:04<00:00, 144.49it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 9]: 100%|█████████▉| 715/717 [00:04<00:00, 144.99it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 9]: 100%|██████████| 717/717 [00:04<00:00, 144.71it/s]


torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([489])
torch.Size([489, 10])
----


[Epoch 10]:   2%|▏         | 14/715 [00:00<00:22, 31.06it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 10]:   6%|▋         | 46/715 [00:00<00:09, 69.59it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 10]:  10%|█         | 72/715 [00:00<00:07, 82.44it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 10]:  14%|█▍        | 101/715 [00:01<00:06, 93.31it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 10]:  19%|█▊        | 133/715 [00:01<00:05, 103.35it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 10]:  23%|██▎       | 165/715 [00:01<00:04, 110.50it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 10]:  28%|██▊       | 197/715 [00:01<00:04, 115.83it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 10]:  32%|███▏      | 229/715 [00:01<00:04, 119.91it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 10]:  37%|███▋      | 264/715 [00:02<00:03, 124.62it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 10]:  42%|████▏     | 297/715 [00:02<00:03, 127.67it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 10]:  46%|████▌     | 329/715 [00:02<00:02, 129.86it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 10]:  50%|█████     | 361/715 [00:02<00:02, 131.69it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 10]:  55%|█████▌    | 394/715 [00:02<00:02, 133.63it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 10]:  60%|█████▉    | 426/715 [00:03<00:02, 135.04it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 10]:  64%|██████▍   | 458/715 [00:03<00:01, 136.11it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 10]:  69%|██████▊   | 490/715 [00:03<00:01, 137.34it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 10]:  73%|███████▎  | 522/715 [00:03<00:01, 138.43it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 10]:  78%|███████▊  | 556/715 [00:03<00:01, 139.77it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 10]:  82%|████████▏ | 589/715 [00:04<00:00, 140.62it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 10]:  87%|████████▋ | 621/715 [00:04<00:00, 141.41it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 10]:  91%|█████████▏| 653/715 [00:04<00:00, 142.13it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 10]:  96%|█████████▌| 686/715 [00:04<00:00, 142.77it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1

[Epoch 10]: 100%|██████████| 715/715 [00:04<00:00, 143.07it/s]

torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([1000])
torch.Size([1000, 10])
----
torch.Size([323])
torch.Size([323, 10])
----





In [37]:
res1 = [1 - spatial.distance.cosine(model_1.ivectors.weight.data.cpu().numpy()[3], model_1.ivectors.weight.data.cpu().numpy()[i]) for i in tqdm(range(1, vocab_size))]


  0%|          | 0/19999 [00:00<?, ?it/s][A
  0%|          | 6/19999 [00:00<05:55, 56.23it/s][A
  0%|          | 11/19999 [00:00<06:17, 52.94it/s][A
  0%|          | 16/19999 [00:00<06:55, 48.14it/s][A
  0%|          | 20/19999 [00:00<07:12, 46.20it/s][A
  0%|          | 24/19999 [00:00<07:24, 44.97it/s][A
  0%|          | 29/19999 [00:00<07:31, 44.23it/s][A
  0%|          | 33/19999 [00:00<07:37, 43.67it/s][A
  0%|          | 38/19999 [00:00<07:41, 43.24it/s][A
  0%|          | 42/19999 [00:00<07:45, 42.90it/s][A
  0%|          | 47/19999 [00:01<07:46, 42.73it/s][A
  0%|          | 52/19999 [00:01<07:49, 42.49it/s][A
  0%|          | 57/19999 [00:01<07:50, 42.37it/s][A
  0%|          | 62/19999 [00:01<07:52, 42.22it/s][A
  0%|          | 67/19999 [00:01<07:53, 42.10it/s][A
  0%|          | 72/19999 [00:01<07:54, 42.00it/s][A
  0%|          | 77/19999 [00:01<07:55, 41.89it/s][A
  0%|          | 82/19999 [00:01<07:56, 41.79it/s][A
  0%|          | 87/19999 [00:02<07:5

  4%|▍         | 796/19999 [00:17<07:04, 45.28it/s][A
  4%|▍         | 801/19999 [00:17<07:03, 45.30it/s][A
  4%|▍         | 806/19999 [00:17<07:03, 45.32it/s][A
  4%|▍         | 811/19999 [00:17<07:03, 45.35it/s][A
  4%|▍         | 816/19999 [00:17<07:02, 45.37it/s][A
  4%|▍         | 822/19999 [00:18<07:02, 45.40it/s][A
  4%|▍         | 828/19999 [00:18<07:01, 45.43it/s][A
  4%|▍         | 834/19999 [00:18<07:01, 45.47it/s][A
  4%|▍         | 840/19999 [00:18<07:01, 45.50it/s][A
  4%|▍         | 846/19999 [00:18<07:00, 45.54it/s][A
  4%|▍         | 852/19999 [00:18<07:00, 45.57it/s][A
  4%|▍         | 858/19999 [00:18<06:59, 45.61it/s][A
  4%|▍         | 864/19999 [00:18<06:59, 45.57it/s][A
  4%|▍         | 869/19999 [00:19<07:00, 45.55it/s][A
  4%|▍         | 874/19999 [00:19<07:00, 45.51it/s][A
  4%|▍         | 879/19999 [00:19<07:00, 45.52it/s][A
  4%|▍         | 884/19999 [00:19<07:00, 45.48it/s][A
  4%|▍         | 890/19999 [00:19<06:59, 45.52it/s][A
  4%|▍    

  8%|▊         | 1597/19999 [00:34<06:42, 45.67it/s][A
  8%|▊         | 1603/19999 [00:35<06:42, 45.68it/s][A
  8%|▊         | 1609/19999 [00:35<06:42, 45.70it/s][A
  8%|▊         | 1615/19999 [00:35<06:42, 45.72it/s][A
  8%|▊         | 1621/19999 [00:35<06:41, 45.74it/s][A
  8%|▊         | 1627/19999 [00:35<06:41, 45.75it/s][A
  8%|▊         | 1633/19999 [00:35<06:41, 45.77it/s][A
  8%|▊         | 1639/19999 [00:35<06:40, 45.79it/s][A
  8%|▊         | 1645/19999 [00:35<06:40, 45.80it/s][A
  8%|▊         | 1651/19999 [00:36<06:40, 45.82it/s][A
  8%|▊         | 1657/19999 [00:36<06:40, 45.84it/s][A
  8%|▊         | 1663/19999 [00:36<06:39, 45.86it/s][A
  8%|▊         | 1669/19999 [00:36<06:39, 45.87it/s][A
  8%|▊         | 1675/19999 [00:36<06:39, 45.89it/s][A
  8%|▊         | 1681/19999 [00:36<06:39, 45.90it/s][A
  8%|▊         | 1687/19999 [00:36<06:38, 45.92it/s][A
  8%|▊         | 1693/19999 [00:36<06:38, 45.94it/s][A
  8%|▊         | 1699/19999 [00:36<06:38, 45.95i

 12%|█▏        | 2417/19999 [00:52<06:21, 46.06it/s][A
 12%|█▏        | 2422/19999 [00:52<06:21, 46.04it/s][A
 12%|█▏        | 2427/19999 [00:52<06:21, 46.03it/s][A
 12%|█▏        | 2432/19999 [00:52<06:21, 46.02it/s][A
 12%|█▏        | 2437/19999 [00:52<06:21, 46.00it/s][A
 12%|█▏        | 2442/19999 [00:53<06:21, 45.99it/s][A
 12%|█▏        | 2447/19999 [00:53<06:21, 45.98it/s][A
 12%|█▏        | 2452/19999 [00:53<06:21, 45.97it/s][A
 12%|█▏        | 2457/19999 [00:53<06:21, 45.95it/s][A
 12%|█▏        | 2462/19999 [00:53<06:21, 45.94it/s][A
 12%|█▏        | 2467/19999 [00:53<06:21, 45.93it/s][A
 12%|█▏        | 2472/19999 [00:53<06:21, 45.92it/s][A
 12%|█▏        | 2477/19999 [00:53<06:21, 45.91it/s][A
 12%|█▏        | 2482/19999 [00:54<06:21, 45.89it/s][A
 12%|█▏        | 2487/19999 [00:54<06:21, 45.88it/s][A
 12%|█▏        | 2492/19999 [00:54<06:21, 45.87it/s][A
 12%|█▏        | 2497/19999 [00:54<06:21, 45.86it/s][A
 13%|█▎        | 2502/19999 [00:54<06:21, 45.85i

 16%|█▌        | 3205/19999 [01:10<06:06, 45.78it/s][A
 16%|█▌        | 3211/19999 [01:10<06:06, 45.78it/s][A
 16%|█▌        | 3217/19999 [01:10<06:06, 45.79it/s][A
 16%|█▌        | 3223/19999 [01:10<06:06, 45.78it/s][A
 16%|█▌        | 3228/19999 [01:10<06:06, 45.77it/s][A
 16%|█▌        | 3233/19999 [01:10<06:06, 45.77it/s][A
 16%|█▌        | 3238/19999 [01:10<06:06, 45.76it/s][A
 16%|█▌        | 3243/19999 [01:10<06:06, 45.75it/s][A
 16%|█▌        | 3248/19999 [01:11<06:06, 45.74it/s][A
 16%|█▋        | 3253/19999 [01:11<06:06, 45.73it/s][A
 16%|█▋        | 3258/19999 [01:11<06:06, 45.72it/s][A
 16%|█▋        | 3264/19999 [01:11<06:05, 45.73it/s][A
 16%|█▋        | 3270/19999 [01:11<06:05, 45.74it/s][A
 16%|█▋        | 3275/19999 [01:11<06:05, 45.74it/s][A
 16%|█▋        | 3280/19999 [01:11<06:05, 45.73it/s][A
 16%|█▋        | 3285/19999 [01:11<06:05, 45.73it/s][A
 16%|█▋        | 3290/19999 [01:11<06:05, 45.72it/s][A
 16%|█▋        | 3295/19999 [01:12<06:05, 45.71i

 20%|██        | 4018/19999 [01:27<05:47, 45.94it/s][A
 20%|██        | 4024/19999 [01:27<05:47, 45.95it/s][A
 20%|██        | 4030/19999 [01:27<05:47, 45.96it/s][A
 20%|██        | 4036/19999 [01:27<05:47, 45.96it/s][A
 20%|██        | 4042/19999 [01:27<05:47, 45.97it/s][A
 20%|██        | 4048/19999 [01:28<05:47, 45.96it/s][A
 20%|██        | 4053/19999 [01:28<05:46, 45.95it/s][A
 20%|██        | 4059/19999 [01:28<05:46, 45.96it/s][A
 20%|██        | 4065/19999 [01:28<05:46, 45.97it/s][A
 20%|██        | 4070/19999 [01:28<05:46, 45.97it/s][A
 20%|██        | 4076/19999 [01:28<05:46, 45.98it/s][A
 20%|██        | 4081/19999 [01:28<05:46, 45.97it/s][A
 20%|██        | 4086/19999 [01:28<05:46, 45.96it/s][A
 20%|██        | 4091/19999 [01:29<05:46, 45.96it/s][A
 20%|██        | 4096/19999 [01:29<05:46, 45.96it/s][A
 21%|██        | 4102/19999 [01:29<05:45, 45.97it/s][A
 21%|██        | 4108/19999 [01:29<05:45, 45.97it/s][A
 21%|██        | 4114/19999 [01:29<05:45, 45.98i

 24%|██▍       | 4808/19999 [01:44<05:31, 45.87it/s][A
 24%|██▍       | 4814/19999 [01:44<05:31, 45.87it/s][A
 24%|██▍       | 4820/19999 [01:45<05:30, 45.88it/s][A
 24%|██▍       | 4826/19999 [01:45<05:30, 45.88it/s][A
 24%|██▍       | 4832/19999 [01:45<05:30, 45.89it/s][A
 24%|██▍       | 4838/19999 [01:45<05:30, 45.89it/s][A
 24%|██▍       | 4844/19999 [01:45<05:30, 45.90it/s][A
 24%|██▍       | 4850/19999 [01:45<05:30, 45.90it/s][A
 24%|██▍       | 4856/19999 [01:45<05:29, 45.91it/s][A
 24%|██▍       | 4862/19999 [01:45<05:29, 45.92it/s][A
 24%|██▍       | 4868/19999 [01:46<05:29, 45.91it/s][A
 24%|██▍       | 4873/19999 [01:46<05:29, 45.90it/s][A
 24%|██▍       | 4878/19999 [01:46<05:29, 45.90it/s][A
 24%|██▍       | 4883/19999 [01:46<05:29, 45.89it/s][A
 24%|██▍       | 4888/19999 [01:46<05:29, 45.88it/s][A
 24%|██▍       | 4893/19999 [01:46<05:29, 45.88it/s][A
 24%|██▍       | 4898/19999 [01:46<05:29, 45.87it/s][A
 25%|██▍       | 4904/19999 [01:46<05:29, 45.88i

 28%|██▊       | 5588/19999 [02:02<05:15, 45.63it/s][A
 28%|██▊       | 5594/19999 [02:02<05:15, 45.63it/s][A
 28%|██▊       | 5600/19999 [02:02<05:15, 45.64it/s][A
 28%|██▊       | 5606/19999 [02:02<05:15, 45.64it/s][A
 28%|██▊       | 5612/19999 [02:02<05:15, 45.65it/s][A
 28%|██▊       | 5618/19999 [02:03<05:15, 45.65it/s][A
 28%|██▊       | 5624/19999 [02:03<05:14, 45.66it/s][A
 28%|██▊       | 5630/19999 [02:03<05:14, 45.66it/s][A
 28%|██▊       | 5636/19999 [02:03<05:14, 45.67it/s][A
 28%|██▊       | 5642/19999 [02:03<05:14, 45.67it/s][A
 28%|██▊       | 5648/19999 [02:03<05:14, 45.67it/s][A
 28%|██▊       | 5653/19999 [02:03<05:14, 45.67it/s][A
 28%|██▊       | 5659/19999 [02:03<05:13, 45.67it/s][A
 28%|██▊       | 5665/19999 [02:04<05:13, 45.68it/s][A
 28%|██▊       | 5671/19999 [02:04<05:13, 45.68it/s][A
 28%|██▊       | 5677/19999 [02:04<05:13, 45.69it/s][A
 28%|██▊       | 5683/19999 [02:04<05:13, 45.69it/s][A
 28%|██▊       | 5689/19999 [02:04<05:13, 45.70i

 32%|███▏      | 6357/19999 [02:20<05:00, 45.34it/s][A
 32%|███▏      | 6362/19999 [02:20<05:00, 45.34it/s][A
 32%|███▏      | 6367/19999 [02:20<05:00, 45.34it/s][A
 32%|███▏      | 6373/19999 [02:20<05:00, 45.35it/s][A
 32%|███▏      | 6379/19999 [02:20<05:00, 45.35it/s][A
 32%|███▏      | 6385/19999 [02:20<05:00, 45.36it/s][A
 32%|███▏      | 6391/19999 [02:20<04:59, 45.36it/s][A
 32%|███▏      | 6397/19999 [02:21<04:59, 45.37it/s][A
 32%|███▏      | 6403/19999 [02:21<04:59, 45.37it/s][A
 32%|███▏      | 6409/19999 [02:21<04:59, 45.38it/s][A
 32%|███▏      | 6415/19999 [02:21<04:59, 45.38it/s][A
 32%|███▏      | 6421/19999 [02:21<04:59, 45.38it/s][A
 32%|███▏      | 6427/19999 [02:21<04:59, 45.39it/s][A
 32%|███▏      | 6433/19999 [02:21<04:58, 45.39it/s][A
 32%|███▏      | 6439/19999 [02:21<04:58, 45.40it/s][A
 32%|███▏      | 6445/19999 [02:21<04:58, 45.40it/s][A
 32%|███▏      | 6451/19999 [02:22<04:58, 45.40it/s][A
 32%|███▏      | 6456/19999 [02:22<04:58, 45.39i

 36%|███▌      | 7163/19999 [02:37<04:42, 45.44it/s][A
 36%|███▌      | 7169/19999 [02:37<04:42, 45.45it/s][A
 36%|███▌      | 7175/19999 [02:37<04:42, 45.45it/s][A
 36%|███▌      | 7181/19999 [02:37<04:42, 45.45it/s][A
 36%|███▌      | 7187/19999 [02:38<04:41, 45.45it/s][A
 36%|███▌      | 7192/19999 [02:38<04:41, 45.45it/s][A
 36%|███▌      | 7197/19999 [02:38<04:41, 45.44it/s][A
 36%|███▌      | 7202/19999 [02:38<04:41, 45.44it/s][A
 36%|███▌      | 7207/19999 [02:38<04:41, 45.43it/s][A
 36%|███▌      | 7212/19999 [02:38<04:41, 45.43it/s][A
 36%|███▌      | 7217/19999 [02:38<04:41, 45.43it/s][A
 36%|███▌      | 7222/19999 [02:38<04:41, 45.42it/s][A
 36%|███▌      | 7228/19999 [02:39<04:41, 45.43it/s][A
 36%|███▌      | 7234/19999 [02:39<04:40, 45.43it/s][A
 36%|███▌      | 7240/19999 [02:39<04:40, 45.44it/s][A
 36%|███▌      | 7246/19999 [02:39<04:40, 45.44it/s][A
 36%|███▋      | 7252/19999 [02:39<04:40, 45.44it/s][A
 36%|███▋      | 7258/19999 [02:39<04:40, 45.45i

 40%|███▉      | 7944/19999 [02:55<04:25, 45.38it/s][A
 40%|███▉      | 7949/19999 [02:55<04:25, 45.38it/s][A
 40%|███▉      | 7954/19999 [02:55<04:25, 45.37it/s][A
 40%|███▉      | 7959/19999 [02:55<04:25, 45.37it/s][A
 40%|███▉      | 7964/19999 [02:55<04:25, 45.37it/s][A
 40%|███▉      | 7969/19999 [02:55<04:25, 45.36it/s][A
 40%|███▉      | 7974/19999 [02:55<04:25, 45.36it/s][A
 40%|███▉      | 7979/19999 [02:55<04:24, 45.36it/s][A
 40%|███▉      | 7984/19999 [02:55<04:24, 45.37it/s][A
 40%|███▉      | 7989/19999 [02:56<04:24, 45.37it/s][A
 40%|███▉      | 7995/19999 [02:56<04:24, 45.37it/s][A
 40%|████      | 8000/19999 [02:56<04:24, 45.37it/s][A
 40%|████      | 8005/19999 [02:56<04:24, 45.36it/s][A
 40%|████      | 8010/19999 [02:56<04:24, 45.36it/s][A
 40%|████      | 8015/19999 [02:56<04:24, 45.36it/s][A
 40%|████      | 8020/19999 [02:56<04:24, 45.35it/s][A
 40%|████      | 8025/19999 [02:56<04:24, 45.35it/s][A
 40%|████      | 8030/19999 [02:57<04:23, 45.35i

 44%|████▎     | 8746/19999 [03:12<04:07, 45.44it/s][A
 44%|████▍     | 8751/19999 [03:12<04:07, 45.43it/s][A
 44%|████▍     | 8756/19999 [03:12<04:07, 45.43it/s][A
 44%|████▍     | 8761/19999 [03:12<04:07, 45.43it/s][A
 44%|████▍     | 8766/19999 [03:12<04:07, 45.43it/s][A
 44%|████▍     | 8771/19999 [03:13<04:07, 45.42it/s][A
 44%|████▍     | 8776/19999 [03:13<04:07, 45.42it/s][A
 44%|████▍     | 8781/19999 [03:13<04:07, 45.41it/s][A
 44%|████▍     | 8786/19999 [03:13<04:06, 45.41it/s][A
 44%|████▍     | 8791/19999 [03:13<04:06, 45.41it/s][A
 44%|████▍     | 8796/19999 [03:13<04:06, 45.41it/s][A
 44%|████▍     | 8801/19999 [03:13<04:06, 45.40it/s][A
 44%|████▍     | 8806/19999 [03:13<04:06, 45.40it/s][A
 44%|████▍     | 8811/19999 [03:14<04:06, 45.40it/s][A
 44%|████▍     | 8817/19999 [03:14<04:06, 45.40it/s][A
 44%|████▍     | 8823/19999 [03:14<04:06, 45.41it/s][A
 44%|████▍     | 8829/19999 [03:14<04:05, 45.41it/s][A
 44%|████▍     | 8835/19999 [03:14<04:05, 45.41i

 48%|████▊     | 9559/19999 [03:29<03:49, 45.52it/s][A
 48%|████▊     | 9564/19999 [03:30<03:49, 45.52it/s][A
 48%|████▊     | 9569/19999 [03:30<03:49, 45.52it/s][A
 48%|████▊     | 9574/19999 [03:30<03:49, 45.52it/s][A
 48%|████▊     | 9579/19999 [03:30<03:48, 45.51it/s][A
 48%|████▊     | 9584/19999 [03:30<03:48, 45.51it/s][A
 48%|████▊     | 9589/19999 [03:30<03:48, 45.51it/s][A
 48%|████▊     | 9594/19999 [03:30<03:48, 45.51it/s][A
 48%|████▊     | 9599/19999 [03:30<03:48, 45.50it/s][A
 48%|████▊     | 9604/19999 [03:31<03:48, 45.50it/s][A
 48%|████▊     | 9609/19999 [03:31<03:48, 45.50it/s][A
 48%|████▊     | 9614/19999 [03:31<03:48, 45.49it/s][A
 48%|████▊     | 9619/19999 [03:31<03:48, 45.49it/s][A
 48%|████▊     | 9624/19999 [03:31<03:48, 45.49it/s][A
 48%|████▊     | 9629/19999 [03:31<03:47, 45.49it/s][A
 48%|████▊     | 9634/19999 [03:31<03:47, 45.48it/s][A
 48%|████▊     | 9639/19999 [03:31<03:47, 45.48it/s][A
 48%|████▊     | 9645/19999 [03:32<03:47, 45.48i

 52%|█████▏    | 10342/19999 [03:47<03:32, 45.49it/s][A
 52%|█████▏    | 10347/19999 [03:47<03:32, 45.48it/s][A
 52%|█████▏    | 10352/19999 [03:47<03:32, 45.49it/s][A
 52%|█████▏    | 10357/19999 [03:47<03:31, 45.48it/s][A
 52%|█████▏    | 10362/19999 [03:47<03:31, 45.48it/s][A
 52%|█████▏    | 10367/19999 [03:47<03:31, 45.48it/s][A
 52%|█████▏    | 10372/19999 [03:48<03:31, 45.47it/s][A
 52%|█████▏    | 10378/19999 [03:48<03:31, 45.48it/s][A
 52%|█████▏    | 10384/19999 [03:48<03:31, 45.48it/s][A
 52%|█████▏    | 10390/19999 [03:48<03:31, 45.48it/s][A
 52%|█████▏    | 10396/19999 [03:48<03:31, 45.48it/s][A
 52%|█████▏    | 10402/19999 [03:48<03:30, 45.49it/s][A
 52%|█████▏    | 10408/19999 [03:48<03:30, 45.49it/s][A
 52%|█████▏    | 10414/19999 [03:48<03:30, 45.49it/s][A
 52%|█████▏    | 10420/19999 [03:49<03:30, 45.49it/s][A
 52%|█████▏    | 10426/19999 [03:49<03:30, 45.50it/s][A
 52%|█████▏    | 10432/19999 [03:49<03:30, 45.50it/s][A
 52%|█████▏    | 10438/19999 [0

 56%|█████▌    | 11135/19999 [04:04<03:14, 45.56it/s][A
 56%|█████▌    | 11140/19999 [04:04<03:14, 45.56it/s][A
 56%|█████▌    | 11145/19999 [04:04<03:14, 45.56it/s][A
 56%|█████▌    | 11150/19999 [04:04<03:14, 45.56it/s][A
 56%|█████▌    | 11155/19999 [04:04<03:14, 45.55it/s][A
 56%|█████▌    | 11160/19999 [04:04<03:14, 45.55it/s][A
 56%|█████▌    | 11165/19999 [04:05<03:13, 45.55it/s][A
 56%|█████▌    | 11170/19999 [04:05<03:13, 45.55it/s][A
 56%|█████▌    | 11175/19999 [04:05<03:13, 45.54it/s][A
 56%|█████▌    | 11180/19999 [04:05<03:13, 45.54it/s][A
 56%|█████▌    | 11186/19999 [04:05<03:13, 45.54it/s][A
 56%|█████▌    | 11192/19999 [04:05<03:13, 45.55it/s][A
 56%|█████▌    | 11198/19999 [04:05<03:13, 45.55it/s][A
 56%|█████▌    | 11204/19999 [04:05<03:13, 45.55it/s][A
 56%|█████▌    | 11210/19999 [04:06<03:12, 45.55it/s][A
 56%|█████▌    | 11216/19999 [04:06<03:12, 45.56it/s][A
 56%|█████▌    | 11222/19999 [04:06<03:12, 45.56it/s][A
 56%|█████▌    | 11228/19999 [0

 59%|█████▉    | 11897/19999 [04:21<02:58, 45.46it/s][A
 60%|█████▉    | 11902/19999 [04:21<02:58, 45.46it/s][A
 60%|█████▉    | 11907/19999 [04:21<02:58, 45.46it/s][A
 60%|█████▉    | 11912/19999 [04:22<02:57, 45.46it/s][A
 60%|█████▉    | 11917/19999 [04:22<02:57, 45.46it/s][A
 60%|█████▉    | 11922/19999 [04:22<02:57, 45.45it/s][A
 60%|█████▉    | 11927/19999 [04:22<02:57, 45.45it/s][A
 60%|█████▉    | 11932/19999 [04:22<02:57, 45.45it/s][A
 60%|█████▉    | 11937/19999 [04:22<02:57, 45.45it/s][A
 60%|█████▉    | 11942/19999 [04:22<02:57, 45.45it/s][A
 60%|█████▉    | 11947/19999 [04:22<02:57, 45.44it/s][A
 60%|█████▉    | 11952/19999 [04:23<02:57, 45.44it/s][A
 60%|█████▉    | 11957/19999 [04:23<02:56, 45.44it/s][A
 60%|█████▉    | 11962/19999 [04:23<02:56, 45.44it/s][A
 60%|█████▉    | 11967/19999 [04:23<02:56, 45.43it/s][A
 60%|█████▉    | 11972/19999 [04:23<02:56, 45.43it/s][A
 60%|█████▉    | 11977/19999 [04:23<02:56, 45.43it/s][A
 60%|█████▉    | 11982/19999 [0

 63%|██████▎   | 12685/19999 [04:38<02:40, 45.51it/s][A
 63%|██████▎   | 12691/19999 [04:38<02:40, 45.51it/s][A
 63%|██████▎   | 12696/19999 [04:38<02:40, 45.51it/s][A
 64%|██████▎   | 12701/19999 [04:39<02:40, 45.51it/s][A
 64%|██████▎   | 12706/19999 [04:39<02:40, 45.51it/s][A
 64%|██████▎   | 12712/19999 [04:39<02:40, 45.51it/s][A
 64%|██████▎   | 12717/19999 [04:39<02:40, 45.51it/s][A
 64%|██████▎   | 12722/19999 [04:39<02:39, 45.51it/s][A
 64%|██████▎   | 12727/19999 [04:39<02:39, 45.51it/s][A
 64%|██████▎   | 12732/19999 [04:39<02:39, 45.50it/s][A
 64%|██████▎   | 12737/19999 [04:39<02:39, 45.50it/s][A
 64%|██████▎   | 12742/19999 [04:40<02:39, 45.50it/s][A
 64%|██████▎   | 12747/19999 [04:40<02:39, 45.50it/s][A
 64%|██████▍   | 12752/19999 [04:40<02:39, 45.50it/s][A
 64%|██████▍   | 12757/19999 [04:40<02:39, 45.50it/s][A
 64%|██████▍   | 12762/19999 [04:40<02:39, 45.50it/s][A
 64%|██████▍   | 12767/19999 [04:40<02:38, 45.50it/s][A
 64%|██████▍   | 12772/19999 [0

 67%|██████▋   | 13441/19999 [04:55<02:24, 45.46it/s][A
 67%|██████▋   | 13446/19999 [04:55<02:24, 45.46it/s][A
 67%|██████▋   | 13451/19999 [04:55<02:24, 45.46it/s][A
 67%|██████▋   | 13456/19999 [04:56<02:23, 45.46it/s][A
 67%|██████▋   | 13461/19999 [04:56<02:23, 45.46it/s][A
 67%|██████▋   | 13466/19999 [04:56<02:23, 45.45it/s][A
 67%|██████▋   | 13471/19999 [04:56<02:23, 45.45it/s][A
 67%|██████▋   | 13476/19999 [04:56<02:23, 45.45it/s][A
 67%|██████▋   | 13481/19999 [04:56<02:23, 45.45it/s][A
 67%|██████▋   | 13486/19999 [04:56<02:23, 45.44it/s][A
 67%|██████▋   | 13491/19999 [04:56<02:23, 45.44it/s][A
 67%|██████▋   | 13496/19999 [04:57<02:23, 45.44it/s][A
 68%|██████▊   | 13501/19999 [04:57<02:23, 45.44it/s][A
 68%|██████▊   | 13506/19999 [04:57<02:22, 45.44it/s][A
 68%|██████▊   | 13511/19999 [04:57<02:22, 45.43it/s][A
 68%|██████▊   | 13516/19999 [04:57<02:22, 45.43it/s][A
 68%|██████▊   | 13521/19999 [04:57<02:22, 45.43it/s][A
 68%|██████▊   | 13526/19999 [0

 71%|███████   | 14182/19999 [05:12<02:08, 45.32it/s][A
 71%|███████   | 14187/19999 [05:13<02:08, 45.33it/s][A
 71%|███████   | 14193/19999 [05:13<02:08, 45.33it/s][A
 71%|███████   | 14199/19999 [05:13<02:07, 45.33it/s][A
 71%|███████   | 14205/19999 [05:13<02:07, 45.33it/s][A
 71%|███████   | 14211/19999 [05:13<02:07, 45.34it/s][A
 71%|███████   | 14217/19999 [05:13<02:07, 45.34it/s][A
 71%|███████   | 14223/19999 [05:13<02:07, 45.34it/s][A
 71%|███████   | 14229/19999 [05:13<02:07, 45.34it/s][A
 71%|███████   | 14235/19999 [05:13<02:07, 45.34it/s][A
 71%|███████   | 14241/19999 [05:14<02:06, 45.35it/s][A
 71%|███████   | 14247/19999 [05:14<02:06, 45.35it/s][A
 71%|███████▏  | 14253/19999 [05:14<02:06, 45.35it/s][A
 71%|███████▏  | 14259/19999 [05:14<02:06, 45.35it/s][A
 71%|███████▏  | 14265/19999 [05:14<02:06, 45.36it/s][A
 71%|███████▏  | 14271/19999 [05:14<02:06, 45.36it/s][A
 71%|███████▏  | 14277/19999 [05:14<02:06, 45.36it/s][A
 71%|███████▏  | 14283/19999 [0

 75%|███████▍  | 14941/19999 [05:30<01:51, 45.26it/s][A
 75%|███████▍  | 14946/19999 [05:30<01:51, 45.26it/s][A
 75%|███████▍  | 14951/19999 [05:30<01:51, 45.26it/s][A
 75%|███████▍  | 14956/19999 [05:30<01:51, 45.26it/s][A
 75%|███████▍  | 14961/19999 [05:30<01:51, 45.25it/s][A
 75%|███████▍  | 14966/19999 [05:30<01:51, 45.25it/s][A
 75%|███████▍  | 14972/19999 [05:30<01:51, 45.25it/s][A
 75%|███████▍  | 14978/19999 [05:30<01:50, 45.26it/s][A
 75%|███████▍  | 14984/19999 [05:31<01:50, 45.26it/s][A
 75%|███████▍  | 14990/19999 [05:31<01:50, 45.26it/s][A
 75%|███████▍  | 14996/19999 [05:31<01:50, 45.26it/s][A
 75%|███████▌  | 15002/19999 [05:31<01:50, 45.27it/s][A
 75%|███████▌  | 15007/19999 [05:31<01:50, 45.27it/s][A
 75%|███████▌  | 15012/19999 [05:31<01:50, 45.26it/s][A
 75%|███████▌  | 15017/19999 [05:31<01:50, 45.26it/s][A
 75%|███████▌  | 15022/19999 [05:31<01:49, 45.26it/s][A
 75%|███████▌  | 15027/19999 [05:32<01:49, 45.26it/s][A
 75%|███████▌  | 15033/19999 [0

 79%|███████▊  | 15727/19999 [05:47<01:34, 45.31it/s][A
 79%|███████▊  | 15732/19999 [05:47<01:34, 45.31it/s][A
 79%|███████▊  | 15738/19999 [05:47<01:34, 45.31it/s][A
 79%|███████▊  | 15744/19999 [05:47<01:33, 45.31it/s][A
 79%|███████▉  | 15750/19999 [05:47<01:33, 45.31it/s][A
 79%|███████▉  | 15755/19999 [05:47<01:33, 45.31it/s][A
 79%|███████▉  | 15760/19999 [05:47<01:33, 45.31it/s][A
 79%|███████▉  | 15765/19999 [05:47<01:33, 45.31it/s][A
 79%|███████▉  | 15770/19999 [05:48<01:33, 45.31it/s][A
 79%|███████▉  | 15775/19999 [05:48<01:33, 45.31it/s][A
 79%|███████▉  | 15780/19999 [05:48<01:33, 45.30it/s][A
 79%|███████▉  | 15785/19999 [05:48<01:33, 45.30it/s][A
 79%|███████▉  | 15790/19999 [05:48<01:32, 45.30it/s][A
 79%|███████▉  | 15795/19999 [05:48<01:32, 45.30it/s][A
 79%|███████▉  | 15800/19999 [05:48<01:32, 45.30it/s][A
 79%|███████▉  | 15805/19999 [05:48<01:32, 45.30it/s][A
 79%|███████▉  | 15810/19999 [05:49<01:32, 45.29it/s][A
 79%|███████▉  | 15815/19999 [0

 83%|████████▎ | 16510/19999 [06:04<01:16, 45.32it/s][A
 83%|████████▎ | 16515/19999 [06:04<01:16, 45.32it/s][A
 83%|████████▎ | 16521/19999 [06:04<01:16, 45.32it/s][A
 83%|████████▎ | 16526/19999 [06:04<01:16, 45.32it/s][A
 83%|████████▎ | 16532/19999 [06:04<01:16, 45.32it/s][A
 83%|████████▎ | 16538/19999 [06:04<01:16, 45.32it/s][A
 83%|████████▎ | 16544/19999 [06:04<01:16, 45.33it/s][A
 83%|████████▎ | 16550/19999 [06:05<01:16, 45.33it/s][A
 83%|████████▎ | 16555/19999 [06:05<01:15, 45.33it/s][A
 83%|████████▎ | 16561/19999 [06:05<01:15, 45.33it/s][A
 83%|████████▎ | 16567/19999 [06:05<01:15, 45.33it/s][A
 83%|████████▎ | 16573/19999 [06:05<01:15, 45.34it/s][A
 83%|████████▎ | 16579/19999 [06:05<01:15, 45.34it/s][A
 83%|████████▎ | 16585/19999 [06:05<01:15, 45.34it/s][A
 83%|████████▎ | 16591/19999 [06:05<01:15, 45.34it/s][A
 83%|████████▎ | 16597/19999 [06:06<01:15, 45.34it/s][A
 83%|████████▎ | 16603/19999 [06:06<01:14, 45.34it/s][A
 83%|████████▎ | 16609/19999 [0

 87%|████████▋ | 17324/19999 [06:21<00:58, 45.44it/s][A
 87%|████████▋ | 17330/19999 [06:21<00:58, 45.44it/s][A
 87%|████████▋ | 17335/19999 [06:21<00:58, 45.44it/s][A
 87%|████████▋ | 17340/19999 [06:21<00:58, 45.44it/s][A
 87%|████████▋ | 17345/19999 [06:21<00:58, 45.44it/s][A
 87%|████████▋ | 17350/19999 [06:21<00:58, 45.43it/s][A
 87%|████████▋ | 17355/19999 [06:21<00:58, 45.43it/s][A
 87%|████████▋ | 17360/19999 [06:22<00:58, 45.43it/s][A
 87%|████████▋ | 17366/19999 [06:22<00:57, 45.43it/s][A
 87%|████████▋ | 17372/19999 [06:22<00:57, 45.43it/s][A
 87%|████████▋ | 17378/19999 [06:22<00:57, 45.44it/s][A
 87%|████████▋ | 17384/19999 [06:22<00:57, 45.44it/s][A
 87%|████████▋ | 17390/19999 [06:22<00:57, 45.44it/s][A
 87%|████████▋ | 17396/19999 [06:22<00:57, 45.44it/s][A
 87%|████████▋ | 17402/19999 [06:22<00:57, 45.44it/s][A
 87%|████████▋ | 17408/19999 [06:23<00:57, 45.44it/s][A
 87%|████████▋ | 17414/19999 [06:23<00:56, 45.45it/s][A
 87%|████████▋ | 17420/19999 [0

 91%|█████████ | 18117/19999 [06:38<00:41, 45.47it/s][A
 91%|█████████ | 18123/19999 [06:38<00:41, 45.47it/s][A
 91%|█████████ | 18129/19999 [06:38<00:41, 45.47it/s][A
 91%|█████████ | 18135/19999 [06:38<00:40, 45.48it/s][A
 91%|█████████ | 18141/19999 [06:38<00:40, 45.48it/s][A
 91%|█████████ | 18147/19999 [06:39<00:40, 45.48it/s][A
 91%|█████████ | 18153/19999 [06:39<00:40, 45.48it/s][A
 91%|█████████ | 18158/19999 [06:39<00:40, 45.48it/s][A
 91%|█████████ | 18163/19999 [06:39<00:40, 45.47it/s][A
 91%|█████████ | 18168/19999 [06:39<00:40, 45.47it/s][A
 91%|█████████ | 18173/19999 [06:39<00:40, 45.47it/s][A
 91%|█████████ | 18178/19999 [06:39<00:40, 45.47it/s][A
 91%|█████████ | 18183/19999 [06:39<00:39, 45.47it/s][A
 91%|█████████ | 18188/19999 [06:40<00:39, 45.47it/s][A
 91%|█████████ | 18193/19999 [06:40<00:39, 45.47it/s][A
 91%|█████████ | 18198/19999 [06:40<00:39, 45.46it/s][A
 91%|█████████ | 18203/19999 [06:40<00:39, 45.46it/s][A
 91%|█████████ | 18208/19999 [0

 95%|█████████▍| 18921/19999 [06:55<00:23, 45.55it/s][A
 95%|█████████▍| 18926/19999 [06:55<00:23, 45.55it/s][A
 95%|█████████▍| 18931/19999 [06:55<00:23, 45.55it/s][A
 95%|█████████▍| 18936/19999 [06:55<00:23, 45.54it/s][A
 95%|█████████▍| 18941/19999 [06:55<00:23, 45.54it/s][A
 95%|█████████▍| 18946/19999 [06:56<00:23, 45.54it/s][A
 95%|█████████▍| 18951/19999 [06:56<00:23, 45.54it/s][A
 95%|█████████▍| 18957/19999 [06:56<00:22, 45.54it/s][A
 95%|█████████▍| 18963/19999 [06:56<00:22, 45.54it/s][A
 95%|█████████▍| 18969/19999 [06:56<00:22, 45.54it/s][A
 95%|█████████▍| 18975/19999 [06:56<00:22, 45.55it/s][A
 95%|█████████▍| 18981/19999 [06:56<00:22, 45.55it/s][A
 95%|█████████▍| 18986/19999 [06:56<00:22, 45.55it/s][A
 95%|█████████▍| 18991/19999 [06:56<00:22, 45.55it/s][A
 95%|█████████▍| 18996/19999 [06:57<00:22, 45.55it/s][A
 95%|█████████▌| 19001/19999 [06:57<00:21, 45.54it/s][A
 95%|█████████▌| 19006/19999 [06:57<00:21, 45.55it/s][A
 95%|█████████▌| 19012/19999 [0

 98%|█████████▊| 19668/19999 [07:12<00:07, 45.45it/s][A
 98%|█████████▊| 19674/19999 [07:12<00:07, 45.45it/s][A
 98%|█████████▊| 19680/19999 [07:12<00:07, 45.45it/s][A
 98%|█████████▊| 19686/19999 [07:13<00:06, 45.45it/s][A
 98%|█████████▊| 19692/19999 [07:13<00:06, 45.46it/s][A
 98%|█████████▊| 19698/19999 [07:13<00:06, 45.46it/s][A
 99%|█████████▊| 19704/19999 [07:13<00:06, 45.46it/s][A
 99%|█████████▊| 19710/19999 [07:13<00:06, 45.46it/s][A
 99%|█████████▊| 19716/19999 [07:13<00:06, 45.46it/s][A
 99%|█████████▊| 19722/19999 [07:13<00:06, 45.46it/s][A
 99%|█████████▊| 19728/19999 [07:13<00:05, 45.46it/s][A
 99%|█████████▊| 19734/19999 [07:14<00:05, 45.46it/s][A
 99%|█████████▊| 19740/19999 [07:14<00:05, 45.46it/s][A
 99%|█████████▊| 19746/19999 [07:14<00:05, 45.47it/s][A
 99%|█████████▉| 19752/19999 [07:14<00:05, 45.47it/s][A
 99%|█████████▉| 19758/19999 [07:14<00:05, 45.47it/s][A
 99%|█████████▉| 19764/19999 [07:14<00:05, 45.47it/s][A
 99%|█████████▉| 19769/19999 [0

In [38]:
spatial.distance.cosine(res, res1)

0.94664735631031804