##### APPROACH:

Further fine-tuning an already fine-tuned model(HATE-SPEECH-BERT) for multilabel classification to identify subcategories of hate speech requires us to assess whether there are improvements in accuracy, precision, recall (F1 score) by initially using a triple classification model for hate speech detection before fine-tuning for multilabel classification. Alternatively, it may be worthwhile to directly fine-tune the model(BERT-LARGE) for multilabel classification from the start

#### Import necessary libraries

In [1]:
! pip install contractions
! pip install -U accelerate
! pip install -U transformers

Collecting contractions
  Downloading contractions-0.1.73-py2.py3-none-any.whl (8.7 kB)
Collecting textsearch>=0.0.21 (from contractions)
  Downloading textsearch-0.0.24-py2.py3-none-any.whl (7.6 kB)
Collecting anyascii (from textsearch>=0.0.21->contractions)
  Downloading anyascii-0.3.2-py3-none-any.whl (289 kB)
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m289.9/289.9 kB[0m [31m5.3 MB/s[0m eta [36m0:00:00[0m
[?25hCollecting pyahocorasick (from textsearch>=0.0.21->contractions)
  Downloading pyahocorasick-2.1.0-cp310-cp310-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_12_x86_64.manylinux2010_x86_64.whl (110 kB)
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m110.7/110.7 kB[0m [31m11.6 MB/s[0m eta [36m0:00:00[0m
[?25hInstalling collected packages: pyahocorasick, anyascii, textsearch, contractions
Successfully installed anyascii-0.3.2 contractions-0.1.73 pyahocorasick-2.1.0 textsearch-0.0.24
Collecting accelerate
  Downloading accelerat

In [41]:
from google.colab import drive
drive.mount('/content/drive',force_remount=True)

Mounted at /content/drive


In [2]:
import torch
import torch.nn as nn
import torch.nn.functional as F
import os
import pandas as pd
import numpy as np
import re
import contractions
import nltk
from nltk.corpus import stopwords
from nltk.stem import WordNetLemmatizer

from torch.utils.data import Dataset, DataLoader
from transformers import AdamW
from collections import defaultdict
import time
from torch.utils.data import DataLoader, TensorDataset
from sklearn.model_selection import train_test_split


#### Loading the pretrained_model
##### [hateBert](https://huggingface.co/GroNLP/hateBERT) Already fine-tuned model

In [3]:
## get the model from the huggingface model hub
!git clone https://huggingface.co/GroNLP/hateBERT

Cloning into 'hateBERT'...
remote: Enumerating objects: 21, done.[K
remote: Total 21 (delta 0), reused 0 (delta 0), pack-reused 21[K
Unpacking objects: 100% (21/21), 112.20 KiB | 7.01 MiB/s, done.
Filtering content: 100% (2/2), 840.10 MiB | 67.21 MiB/s, done.


In [4]:
## If you download the model locally , you can load it from the local path
PATH = os.getcwd()+"/hateBERT"

## Load the BERT model
from transformers import BertTokenizer, BertModel
tokenizer = BertTokenizer.from_pretrained(PATH)
model = BertModel.from_pretrained(PATH)

print(model)


BertModel(
  (embeddings): BertEmbeddings(
    (word_embeddings): Embedding(30522, 768, padding_idx=0)
    (position_embeddings): Embedding(512, 768)
    (token_type_embeddings): Embedding(2, 768)
    (LayerNorm): LayerNorm((768,), eps=1e-12, elementwise_affine=True)
    (dropout): Dropout(p=0.1, inplace=False)
  )
  (encoder): BertEncoder(
    (layer): ModuleList(
      (0-11): 12 x BertLayer(
        (attention): BertAttention(
          (self): BertSelfAttention(
            (query): Linear(in_features=768, out_features=768, bias=True)
            (key): Linear(in_features=768, out_features=768, bias=True)
            (value): Linear(in_features=768, out_features=768, bias=True)
            (dropout): Dropout(p=0.1, inplace=False)
          )
          (output): BertSelfOutput(
            (dense): Linear(in_features=768, out_features=768, bias=True)
            (LayerNorm): LayerNorm((768,), eps=1e-12, elementwise_affine=True)
            (dropout): Dropout(p=0.1, inplace=False)
  

In [5]:
# Load the model weights using hugingface model hub
from transformers import BertTokenizer, BertModel
import torch

# Example of getting the output of the model for a given text
def tokenize_text(text):
    return tokenizer(text, padding=True, truncation=True, return_tensors="pt")

# Use the model in inference mode and classify a give example
def classify(text):
    inputs = tokenize_text(text)
    print(inputs)
    outputs = model(**inputs)
    return outputs

text = "Hello World"
outputs = classify(text)
print(outputs)

{'input_ids': tensor([[ 101, 7592, 2088,  102]]), 'token_type_ids': tensor([[0, 0, 0, 0]]), 'attention_mask': tensor([[1, 1, 1, 1]])}
BaseModelOutputWithPoolingAndCrossAttentions(last_hidden_state=tensor([[[-0.6163,  0.4899,  0.6045,  ..., -0.0070,  0.6881,  0.5794],
         [-0.7543, -0.0851,  0.9398,  ..., -0.3023, -0.1036,  0.7563],
         [-0.4167,  0.3670,  0.5797,  ..., -0.2335,  0.2327, -0.3771],
         [ 0.1706,  0.1823,  1.2238,  ...,  0.1885,  1.3003,  0.2482]]],
       grad_fn=<NativeLayerNormBackward0>), pooler_output=tensor([[-0.8061, -0.1458,  0.9448,  0.6965, -0.7556, -0.2725,  0.7985,  0.1897,
          0.8852, -0.9938,  0.4638, -0.3088,  0.9876, -0.8221,  0.9338, -0.0994,
         -0.0384, -0.3089,  0.4715, -0.3408,  0.7167, -0.6686,  0.7346, -0.0056,
          0.0972, -0.5668, -0.4905,  0.9583,  0.9329,  0.7648, -0.6556,  0.1152,
         -0.9940, -0.3204,  0.8402, -0.9773, -0.0690, -0.6670, -0.0889, -0.0813,
         -0.9264,  0.3244,  0.9340,  0.2341,  0.0877, 

##### Import the multilabel data
##### [UCBerkeley - Hate Speech Dataset (Multilabel)](https://huggingface.co/datasets/ucberkeley-dlab/measuring-hate-speech)


In [10]:
# Download the data locally
# https://huggingface.co/datasets/ucberkeley-dlab/measuring-hate-speech/tree/main

## Read the measuring-hate-speech.parquet
parquet_data = pd.read_parquet('measuring-hate-speech.parquet')

## remove from df the redundant  columns
multilabel_dataset = parquet_data.iloc[:, :-116]

## Remove comment_idm,annotator_id,platform and put the column text in the first position
multilabel_dataset = multilabel_dataset[['text','sentiment', 'hatespeech', 'hate_speech_score', 'respect','insult','humiliate','status','dehumanize','violence','genocide' ,'attack_defend']]
multilabel_dataset

Unnamed: 0,text,sentiment,hatespeech,hate_speech_score,respect,insult,humiliate,status,dehumanize,violence,genocide,attack_defend
0,Yes indeed. She sort of reminds me of the elde...,0.0,0.0,-3.90,0.0,0.0,0.0,2.0,0.0,0.0,0.0,0.0
1,The trans women reading this tweet right now i...,0.0,0.0,-6.52,0.0,0.0,0.0,2.0,0.0,0.0,0.0,2.0
2,Question: These 4 broads who criticize America...,4.0,2.0,0.36,4.0,4.0,4.0,4.0,4.0,0.0,0.0,4.0
3,It is about time for all illegals to go back t...,2.0,0.0,0.26,3.0,2.0,1.0,2.0,0.0,0.0,0.0,3.0
4,For starters bend over the one in pink and kic...,4.0,2.0,1.54,4.0,4.0,4.0,4.0,4.0,4.0,1.0,3.0
...,...,...,...,...,...,...,...,...,...,...,...,...
135551,عاجل سماحة #السيد_عبدالملك_بدرالدين_الحوثي نص...,1.0,0.0,-4.88,1.0,0.0,0.0,2.0,0.0,0.0,0.0,2.0
135552,Millions of #Yemen-is participated in mass ral...,2.0,0.0,-4.40,0.0,0.0,0.0,2.0,0.0,0.0,0.0,1.0
135553,@AbeShinzo @realDonaldTrump @shinzoabe 独裁者は行きま...,1.0,0.0,-2.49,1.0,1.0,1.0,1.0,0.0,0.0,0.0,1.0
135554,Millions of #Yemen-is participated in mass ral...,2.0,0.0,-4.40,0.0,0.0,0.0,2.0,0.0,0.0,0.0,2.0


### Preprocessing text data

In [11]:
## Preprocess the TEXT data
## Remove HTML tags
def remove_html_tags(text):
    clean = re.compile('<.*?>')
    return re.sub(clean, '', text)

multilabel_dataset['text'] = multilabel_dataset['text'].apply(lambda x: remove_html_tags(x))

## Remove URL
def remove_url(text):
    return re.sub(r'http\S+', '', text)

multilabel_dataset['text'] = multilabel_dataset['text'].apply(lambda x: remove_url(x))

## Lowercase
multilabel_dataset['text'] = multilabel_dataset['text'].str.lower()

## Remove punctuation
def remove_punctuation(text):
    return re.sub(r'[^\w\s]', '', text)

multilabel_dataset['text'] = multilabel_dataset['text'].apply(lambda x: remove_punctuation(x))

## Handling Contractions using libraries

def expand_contractions(text):
    return contractions.fix(text)

multilabel_dataset['text'] = multilabel_dataset['text'].apply(lambda x: expand_contractions(x))

## Remove stopwords
nltk.download('stopwords')
stop_words = set(stopwords.words('english'))

def remove_stopwords(text):
    return " ".join([word for word in str(text).split() if word not in stop_words])

multilabel_dataset['text'] = multilabel_dataset['text'].apply(lambda x: remove_stopwords(x))

## Lemmatization
nltk.download('wordnet')
lemmatizer = WordNetLemmatizer()

def lemmatize_words(text):
    return " ".join([lemmatizer.lemmatize(word) for word in text.split()])
multilabel_dataset['text'] = multilabel_dataset['text'].apply(lambda x: lemmatize_words(x))

[nltk_data] Downloading package stopwords to /root/nltk_data...
[nltk_data]   Unzipping corpora/stopwords.zip.
[nltk_data] Downloading package wordnet to /root/nltk_data...


#### Preprocess labeling

In [12]:
## Replace each catefory of hatespeech with 0 or 1 for the columns respect, insult, humiliate, status, dehumanize, violence, genocide, attack_defend
## Do it more efficiently

# List of columns to transform
columns_to_transform = ['respect', 'insult', 'humiliate', 'status',
                        'dehumanize', 'violence', 'genocide', 'attack_defend']

# Apply the transformation
for column in columns_to_transform:
    multilabel_dataset[column] = multilabel_dataset[column].apply(lambda x: 1 if x > 0 else 0)
multilabel_dataset


Unnamed: 0,text,sentiment,hatespeech,hate_speech_score,respect,insult,humiliate,status,dehumanize,violence,genocide,attack_defend
0,yes indeed sort reminds elder lady played part...,0.0,0.0,-3.90,0,0,0,1,0,0,0,0
1,trans woman reading tweet right beautiful,0.0,0.0,-6.52,0,0,0,1,0,0,0,1
2,question 4 broad criticize america country fle...,4.0,2.0,0.36,1,1,1,1,1,0,0,1
3,time illegals go back country origin keep free...,2.0,0.0,0.26,1,1,1,1,0,0,0,1
4,starter bend one pink kick as pussy get taste ...,4.0,2.0,1.54,1,1,1,1,1,1,1,1
...,...,...,...,...,...,...,...,...,...,...,...,...
135551,عاجل سماحة السيد_عبدالملك_بدرالدين_الحوثي نصره...,1.0,0.0,-4.88,1,0,0,1,0,0,0,1
135552,million yemeni participated mass rally 13squar...,2.0,0.0,-4.40,0,0,0,1,0,0,0,1
135553,abeshinzo realdonaldtrump shinzoabe 独裁者は行きますこれ...,1.0,0.0,-2.49,1,1,1,1,0,0,0,1
135554,million yemeni participated mass rally 13squar...,2.0,0.0,-4.40,0,0,0,1,0,0,0,1


In [13]:
multilabel_dataset['labels']=multilabel_dataset[columns_to_transform].values.tolist()
multilabel_dataset = multilabel_dataset[multilabel_dataset['text'] != '']
multilabel_dataset

Unnamed: 0,text,sentiment,hatespeech,hate_speech_score,respect,insult,humiliate,status,dehumanize,violence,genocide,attack_defend,labels
0,yes indeed sort reminds elder lady played part...,0.0,0.0,-3.90,0,0,0,1,0,0,0,0,"[0, 0, 0, 1, 0, 0, 0, 0]"
1,trans woman reading tweet right beautiful,0.0,0.0,-6.52,0,0,0,1,0,0,0,1,"[0, 0, 0, 1, 0, 0, 0, 1]"
2,question 4 broad criticize america country fle...,4.0,2.0,0.36,1,1,1,1,1,0,0,1,"[1, 1, 1, 1, 1, 0, 0, 1]"
3,time illegals go back country origin keep free...,2.0,0.0,0.26,1,1,1,1,0,0,0,1,"[1, 1, 1, 1, 0, 0, 0, 1]"
4,starter bend one pink kick as pussy get taste ...,4.0,2.0,1.54,1,1,1,1,1,1,1,1,"[1, 1, 1, 1, 1, 1, 1, 1]"
...,...,...,...,...,...,...,...,...,...,...,...,...,...
135551,عاجل سماحة السيد_عبدالملك_بدرالدين_الحوثي نصره...,1.0,0.0,-4.88,1,0,0,1,0,0,0,1,"[1, 0, 0, 1, 0, 0, 0, 1]"
135552,million yemeni participated mass rally 13squar...,2.0,0.0,-4.40,0,0,0,1,0,0,0,1,"[0, 0, 0, 1, 0, 0, 0, 1]"
135553,abeshinzo realdonaldtrump shinzoabe 独裁者は行きますこれ...,1.0,0.0,-2.49,1,1,1,1,0,0,0,1,"[1, 1, 1, 1, 0, 0, 0, 1]"
135554,million yemeni participated mass rally 13squar...,2.0,0.0,-4.40,0,0,0,1,0,0,0,1,"[0, 0, 0, 1, 0, 0, 0, 1]"


#### Dataset/Dataloader

In [9]:
#X = multilabel_dataset['text'].values.tolist()
#encoded_inputs = tokenizer(X, padding=True, truncation=True,max_length=256, return_tensors='pt')

In [10]:
#labels = multilabel_dataset[columns_to_transform].values  # Assuming you have extracted binary labels
#encoded_inputs['labels']=torch.tensor(labels, dtype=torch.float)

In [11]:
#encoded_inputs

In [12]:
#inputs = multilabel_dataset['text'].values
#labels = multilabel_dataset[columns_to_transform].values

In [14]:
MAX_LEN = 256
TRAIN_BATCH_SIZE = 16
VALID_BATCH_SIZE = 8
EPOCHS = 1
LEARNING_RATE = 1e-05

In [15]:
device = torch.device('cuda') if torch.cuda.is_available() else torch.device('cpu')

In [16]:
import torch
from torch.utils.data import Dataset

class HateSpeechDataset(Dataset):
    def __init__(self, data, tokenizer,max_len=256):

        self.tokenizer = tokenizer
        self.data = data
        self.text = data.text
        self.targets = self.data.labels
        self.max_len = max_len

    def __len__(self):
        return len(self.data)

    def __getitem__(self, idx):

        text = str(self.text.iloc[idx])

        encoding = self.tokenizer.encode_plus(
            text,
            add_special_tokens=True,
            max_length=self.max_len,
            padding='max_length',
            truncation=True,
            return_token_type_ids=True
        )


        ids = encoding['input_ids']
        mask = encoding['attention_mask']
        token_type_ids = encoding['token_type_ids']

        return {
            'input_ids': torch.tensor(ids, dtype=torch.long),
            'attention_mask': torch.tensor(mask, dtype=torch.long),
            'token_type_ids': torch.tensor(token_type_ids, dtype=torch.long),
            'targets': torch.tensor(self.targets.iloc[idx], dtype=torch.float).to(device)
        }


In [17]:
train_texts, val_texts,= train_test_split(multilabel_dataset,test_size=0.2)

print("Dataset length: {}".format(multilabel_dataset.shape))
print("Train Dataset length: {}".format(train_texts.shape))
print("Val Dataset length: {}".format(val_texts.shape))

Dataset length: (135555, 13)
Train Dataset length: (108444, 13)
Val Dataset length: (27111, 13)


In [18]:
training_dataset = HateSpeechDataset(train_texts,tokenizer,MAX_LEN)
validation_dataset = HateSpeechDataset(val_texts,tokenizer,MAX_LEN)

In [19]:
train_params = {'batch_size': TRAIN_BATCH_SIZE,
                'shuffle': True,
                'num_workers': 0
                }

test_params = {'batch_size': VALID_BATCH_SIZE,
                'shuffle': True,
                'num_workers': 0
                }

training_loader = DataLoader(training_dataset, **train_params)
validation_loader = DataLoader(validation_dataset, **test_params)

In [20]:
next(iter(training_loader))

{'input_ids': tensor([[  101,  3287,  2066,  ...,     0,     0,     0],
         [  101, 14120,  2516,  ...,     0,     0,     0],
         [  101,  5907, 10067,  ...,     0,     0,     0],
         ...,
         [  101, 27793,  2102,  ...,     0,     0,     0],
         [  101,  2111,  2066,  ...,     0,     0,     0],
         [  101, 11376,  5094,  ...,     0,     0,     0]]),
 'attention_mask': tensor([[1, 1, 1,  ..., 0, 0, 0],
         [1, 1, 1,  ..., 0, 0, 0],
         [1, 1, 1,  ..., 0, 0, 0],
         ...,
         [1, 1, 1,  ..., 0, 0, 0],
         [1, 1, 1,  ..., 0, 0, 0],
         [1, 1, 1,  ..., 0, 0, 0]]),
 'token_type_ids': tensor([[0, 0, 0,  ..., 0, 0, 0],
         [0, 0, 0,  ..., 0, 0, 0],
         [0, 0, 0,  ..., 0, 0, 0],
         ...,
         [0, 0, 0,  ..., 0, 0, 0],
         [0, 0, 0,  ..., 0, 0, 0],
         [0, 0, 0,  ..., 0, 0, 0]]),
 'targets': tensor([[1., 1., 1., 1., 1., 0., 0., 1.],
         [1., 1., 1., 1., 1., 0., 0., 1.],
         [0., 0., 0., 1., 0., 0.

#### Fine Tuning the model

In [21]:
print(model)

BertModel(
  (embeddings): BertEmbeddings(
    (word_embeddings): Embedding(30522, 768, padding_idx=0)
    (position_embeddings): Embedding(512, 768)
    (token_type_embeddings): Embedding(2, 768)
    (LayerNorm): LayerNorm((768,), eps=1e-12, elementwise_affine=True)
    (dropout): Dropout(p=0.1, inplace=False)
  )
  (encoder): BertEncoder(
    (layer): ModuleList(
      (0-11): 12 x BertLayer(
        (attention): BertAttention(
          (self): BertSelfAttention(
            (query): Linear(in_features=768, out_features=768, bias=True)
            (key): Linear(in_features=768, out_features=768, bias=True)
            (value): Linear(in_features=768, out_features=768, bias=True)
            (dropout): Dropout(p=0.1, inplace=False)
          )
          (output): BertSelfOutput(
            (dense): Linear(in_features=768, out_features=768, bias=True)
            (LayerNorm): LayerNorm((768,), eps=1e-12, elementwise_affine=True)
            (dropout): Dropout(p=0.1, inplace=False)
  

In [22]:
# Creating the customized model, by adding a drop out and a dense layer on top of distil bert to get the final output for the model.

class MultilabelHateBert(torch.nn.Module):
    def __init__(self,bertmodel):
        super(MultilabelHateBert, self).__init__()
        self.bertmodel = bertmodel
        self.dropout = torch.nn.Dropout(0.3)
        self.linear = torch.nn.Linear(768, len(columns_to_transform))

    def forward(self, ids, mask, token_type_ids):

      output_1= self.bertmodel(ids, attention_mask = mask, token_type_ids = token_type_ids)
      output_2 = self.dropout(output_1.pooler_output)
      output = self.linear(output_2)
      return output

multilabel_model = MultilabelHateBert(model)
multilabel_model.to(device)

MultilabelHateBert(
  (bertmodel): BertModel(
    (embeddings): BertEmbeddings(
      (word_embeddings): Embedding(30522, 768, padding_idx=0)
      (position_embeddings): Embedding(512, 768)
      (token_type_embeddings): Embedding(2, 768)
      (LayerNorm): LayerNorm((768,), eps=1e-12, elementwise_affine=True)
      (dropout): Dropout(p=0.1, inplace=False)
    )
    (encoder): BertEncoder(
      (layer): ModuleList(
        (0-11): 12 x BertLayer(
          (attention): BertAttention(
            (self): BertSelfAttention(
              (query): Linear(in_features=768, out_features=768, bias=True)
              (key): Linear(in_features=768, out_features=768, bias=True)
              (value): Linear(in_features=768, out_features=768, bias=True)
              (dropout): Dropout(p=0.1, inplace=False)
            )
            (output): BertSelfOutput(
              (dense): Linear(in_features=768, out_features=768, bias=True)
              (LayerNorm): LayerNorm((768,), eps=1e-12, eleme

In [23]:
def criterion(outputs, targets):
    return torch.nn.BCEWithLogitsLoss()(outputs, targets)

In [24]:
optimizer = torch.optim.Adam(params =  multilabel_model.parameters(), lr=LEARNING_RATE)


#### Training Loop

In [26]:
from tqdm import tqdm

total_loss = 0.0
batch_count = 0

for epoch in tqdm(range(EPOCHS), desc="Epochs"):

  multilabel_model.train()

  for i, batch in tqdm(enumerate(training_loader), desc=f"Epoch {epoch + 1}", total=len(training_loader)):

    input_ids = batch['input_ids'].to(device)
    attention_mask = batch['attention_mask'].to(device)
    token_type_ids = batch['token_type_ids'].to(device)
    targets = batch['targets'].to(device)

    outputs = multilabel_model(input_ids,attention_mask,token_type_ids)
    optimizer.zero_grad()
    loss = criterion(outputs,targets)

    total_loss += loss.item()
    batch_count += 1
    if i%50==0:
      print()
      print(f'Epoch: {epoch}, Loss{total_loss/batch_count}')

    optimizer.zero_grad()
    loss.backward()
    optimizer.step()

Epochs:   0%|          | 0/1 [00:00<?, ?it/s]
Epoch 1:   0%|          | 0/6778 [00:00<?, ?it/s][A
Epoch 1:   0%|          | 1/6778 [00:00<40:29,  2.79it/s][A


Epoch: 0, Loss0.3581532835960388



Epoch 1:   0%|          | 2/6778 [00:01<59:03,  1.91it/s][A
Epoch 1:   0%|          | 3/6778 [00:01<1:07:08,  1.68it/s][A
Epoch 1:   0%|          | 4/6778 [00:02<1:09:39,  1.62it/s][A
Epoch 1:   0%|          | 5/6778 [00:03<1:12:36,  1.55it/s][A
Epoch 1:   0%|          | 6/6778 [00:03<1:13:26,  1.54it/s][A
Epoch 1:   0%|          | 7/6778 [00:04<1:12:31,  1.56it/s][A
Epoch 1:   0%|          | 8/6778 [00:04<1:14:03,  1.52it/s][A
Epoch 1:   0%|          | 9/6778 [00:05<1:13:29,  1.54it/s][A
Epoch 1:   0%|          | 10/6778 [00:06<1:13:28,  1.54it/s][A
Epoch 1:   0%|          | 11/6778 [00:06<1:14:06,  1.52it/s][A
Epoch 1:   0%|          | 12/6778 [00:07<1:14:00,  1.52it/s][A
Epoch 1:   0%|          | 13/6778 [00:08<1:13:49,  1.53it/s][A
Epoch 1:   0%|          | 14/6778 [00:08<1:14:17,  1.52it/s][A
Epoch 1:   0%|          | 15/6778 [00:09<1:14:01,  1.52it/s][A
Epoch 1:   0%|          | 16/6778 [00:10<1:14:34,  1.51it/s][A
Epoch 1:   0%|          | 17/6778 [00:11<1:17:31,


Epoch: 0, Loss0.3296339935531803



Epoch 1:   1%|          | 52/6778 [00:34<1:15:44,  1.48it/s][A
Epoch 1:   1%|          | 53/6778 [00:35<1:15:28,  1.49it/s][A
Epoch 1:   1%|          | 54/6778 [00:35<1:15:23,  1.49it/s][A
Epoch 1:   1%|          | 55/6778 [00:36<1:15:16,  1.49it/s][A
Epoch 1:   1%|          | 56/6778 [00:37<1:15:14,  1.49it/s][A
Epoch 1:   1%|          | 57/6778 [00:37<1:15:02,  1.49it/s][A
Epoch 1:   1%|          | 58/6778 [00:38<1:14:57,  1.49it/s][A
Epoch 1:   1%|          | 59/6778 [00:39<1:14:52,  1.50it/s][A
Epoch 1:   1%|          | 60/6778 [00:39<1:14:55,  1.49it/s][A
Epoch 1:   1%|          | 61/6778 [00:40<1:14:48,  1.50it/s][A
Epoch 1:   1%|          | 62/6778 [00:41<1:14:49,  1.50it/s][A
Epoch 1:   1%|          | 63/6778 [00:41<1:14:28,  1.50it/s][A
Epoch 1:   1%|          | 64/6778 [00:42<1:14:56,  1.49it/s][A
Epoch 1:   1%|          | 65/6778 [00:43<1:14:49,  1.50it/s][A
Epoch 1:   1%|          | 66/6778 [00:43<1:14:42,  1.50it/s][A
Epoch 1:   1%|          | 67/6778 [00:4


Epoch: 0, Loss0.32888761044728876



Epoch 1:   2%|▏         | 102/6778 [01:07<1:12:27,  1.54it/s][A
Epoch 1:   2%|▏         | 103/6778 [01:08<1:12:19,  1.54it/s][A
Epoch 1:   2%|▏         | 104/6778 [01:08<1:12:17,  1.54it/s][A
Epoch 1:   2%|▏         | 105/6778 [01:09<1:12:48,  1.53it/s][A
Epoch 1:   2%|▏         | 106/6778 [01:09<1:13:24,  1.51it/s][A
Epoch 1:   2%|▏         | 107/6778 [01:10<1:12:40,  1.53it/s][A
Epoch 1:   2%|▏         | 108/6778 [01:11<1:13:06,  1.52it/s][A
Epoch 1:   2%|▏         | 109/6778 [01:11<1:12:46,  1.53it/s][A
Epoch 1:   2%|▏         | 110/6778 [01:12<1:12:00,  1.54it/s][A
Epoch 1:   2%|▏         | 111/6778 [01:13<1:12:27,  1.53it/s][A
Epoch 1:   2%|▏         | 112/6778 [01:13<1:11:51,  1.55it/s][A
Epoch 1:   2%|▏         | 113/6778 [01:14<1:12:05,  1.54it/s][A
Epoch 1:   2%|▏         | 114/6778 [01:15<1:12:24,  1.53it/s][A
Epoch 1:   2%|▏         | 115/6778 [01:15<1:11:50,  1.55it/s][A
Epoch 1:   2%|▏         | 116/6778 [01:16<1:11:50,  1.55it/s][A
Epoch 1:   2%|▏         


Epoch: 0, Loss0.3270567094056022



Epoch 1:   2%|▏         | 152/6778 [01:40<1:12:30,  1.52it/s][A
Epoch 1:   2%|▏         | 153/6778 [01:40<1:12:24,  1.52it/s][A
Epoch 1:   2%|▏         | 154/6778 [01:41<1:12:23,  1.52it/s][A
Epoch 1:   2%|▏         | 155/6778 [01:42<1:12:17,  1.53it/s][A
Epoch 1:   2%|▏         | 156/6778 [01:42<1:12:20,  1.53it/s][A
Epoch 1:   2%|▏         | 157/6778 [01:43<1:12:22,  1.52it/s][A
Epoch 1:   2%|▏         | 158/6778 [01:43<1:12:24,  1.52it/s][A
Epoch 1:   2%|▏         | 159/6778 [01:44<1:12:20,  1.52it/s][A
Epoch 1:   2%|▏         | 160/6778 [01:45<1:12:30,  1.52it/s][A
Epoch 1:   2%|▏         | 161/6778 [01:45<1:12:22,  1.52it/s][A
Epoch 1:   2%|▏         | 162/6778 [01:46<1:12:34,  1.52it/s][A
Epoch 1:   2%|▏         | 163/6778 [01:47<1:12:40,  1.52it/s][A
Epoch 1:   2%|▏         | 164/6778 [01:47<1:12:40,  1.52it/s][A
Epoch 1:   2%|▏         | 165/6778 [01:48<1:12:37,  1.52it/s][A
Epoch 1:   2%|▏         | 166/6778 [01:49<1:13:11,  1.51it/s][A
Epoch 1:   2%|▏         


Epoch: 0, Loss0.3260041510880883



Epoch 1:   3%|▎         | 202/6778 [02:13<1:13:48,  1.48it/s][A
Epoch 1:   3%|▎         | 203/6778 [02:13<1:13:14,  1.50it/s][A
Epoch 1:   3%|▎         | 204/6778 [02:14<1:11:47,  1.53it/s][A
Epoch 1:   3%|▎         | 205/6778 [02:15<1:11:54,  1.52it/s][A
Epoch 1:   3%|▎         | 206/6778 [02:15<1:11:45,  1.53it/s][A
Epoch 1:   3%|▎         | 207/6778 [02:16<1:12:20,  1.51it/s][A
Epoch 1:   3%|▎         | 208/6778 [02:17<1:12:26,  1.51it/s][A
Epoch 1:   3%|▎         | 209/6778 [02:17<1:12:35,  1.51it/s][A
Epoch 1:   3%|▎         | 210/6778 [02:18<1:12:27,  1.51it/s][A
Epoch 1:   3%|▎         | 211/6778 [02:19<1:12:45,  1.50it/s][A
Epoch 1:   3%|▎         | 212/6778 [02:19<1:12:10,  1.52it/s][A
Epoch 1:   3%|▎         | 213/6778 [02:20<1:12:01,  1.52it/s][A
Epoch 1:   3%|▎         | 214/6778 [02:21<1:11:42,  1.53it/s][A
Epoch 1:   3%|▎         | 215/6778 [02:21<1:12:00,  1.52it/s][A
Epoch 1:   3%|▎         | 216/6778 [02:22<1:11:53,  1.52it/s][A
Epoch 1:   3%|▎         


Epoch: 0, Loss0.3271339896071955



Epoch 1:   4%|▎         | 252/6778 [02:46<1:12:17,  1.50it/s][A
Epoch 1:   4%|▎         | 253/6778 [02:46<1:11:56,  1.51it/s][A
Epoch 1:   4%|▎         | 254/6778 [02:47<1:11:32,  1.52it/s][A
Epoch 1:   4%|▍         | 255/6778 [02:47<1:11:36,  1.52it/s][A
Epoch 1:   4%|▍         | 256/6778 [02:48<1:11:23,  1.52it/s][A
Epoch 1:   4%|▍         | 257/6778 [02:49<1:11:15,  1.53it/s][A
Epoch 1:   4%|▍         | 258/6778 [02:49<1:11:13,  1.53it/s][A
Epoch 1:   4%|▍         | 259/6778 [02:50<1:11:06,  1.53it/s][A
Epoch 1:   4%|▍         | 260/6778 [02:51<1:11:08,  1.53it/s][A
Epoch 1:   4%|▍         | 261/6778 [02:51<1:11:02,  1.53it/s][A
Epoch 1:   4%|▍         | 262/6778 [02:52<1:11:04,  1.53it/s][A
Epoch 1:   4%|▍         | 263/6778 [02:53<1:10:48,  1.53it/s][A
Epoch 1:   4%|▍         | 264/6778 [02:53<1:10:56,  1.53it/s][A
Epoch 1:   4%|▍         | 265/6778 [02:54<1:10:52,  1.53it/s][A
Epoch 1:   4%|▍         | 266/6778 [02:55<1:10:57,  1.53it/s][A
Epoch 1:   4%|▍         


Epoch: 0, Loss0.3256120888200709



Epoch 1:   4%|▍         | 302/6778 [03:18<1:10:31,  1.53it/s][A
Epoch 1:   4%|▍         | 303/6778 [03:19<1:10:35,  1.53it/s][A
Epoch 1:   4%|▍         | 304/6778 [03:20<1:10:37,  1.53it/s][A
Epoch 1:   4%|▍         | 305/6778 [03:20<1:10:39,  1.53it/s][A
Epoch 1:   5%|▍         | 306/6778 [03:21<1:10:29,  1.53it/s][A
Epoch 1:   5%|▍         | 307/6778 [03:22<1:10:24,  1.53it/s][A
Epoch 1:   5%|▍         | 308/6778 [03:22<1:10:20,  1.53it/s][A
Epoch 1:   5%|▍         | 309/6778 [03:23<1:11:02,  1.52it/s][A
Epoch 1:   5%|▍         | 310/6778 [03:24<1:10:53,  1.52it/s][A
Epoch 1:   5%|▍         | 311/6778 [03:24<1:10:44,  1.52it/s][A
Epoch 1:   5%|▍         | 312/6778 [03:25<1:10:48,  1.52it/s][A
Epoch 1:   5%|▍         | 313/6778 [03:26<1:11:04,  1.52it/s][A
Epoch 1:   5%|▍         | 314/6778 [03:26<1:11:03,  1.52it/s][A
Epoch 1:   5%|▍         | 315/6778 [03:27<1:10:25,  1.53it/s][A
Epoch 1:   5%|▍         | 316/6778 [03:27<1:10:43,  1.52it/s][A
Epoch 1:   5%|▍         


Epoch: 0, Loss0.3225639381809452



Epoch 1:   5%|▌         | 352/6778 [03:51<1:10:27,  1.52it/s][A
Epoch 1:   5%|▌         | 353/6778 [03:52<1:10:35,  1.52it/s][A
Epoch 1:   5%|▌         | 354/6778 [03:53<1:10:41,  1.51it/s][A
Epoch 1:   5%|▌         | 355/6778 [03:53<1:11:07,  1.51it/s][A
Epoch 1:   5%|▌         | 356/6778 [03:54<1:10:14,  1.52it/s][A
Epoch 1:   5%|▌         | 357/6778 [03:55<1:10:00,  1.53it/s][A
Epoch 1:   5%|▌         | 358/6778 [03:55<1:10:00,  1.53it/s][A
Epoch 1:   5%|▌         | 359/6778 [03:56<1:09:54,  1.53it/s][A
Epoch 1:   5%|▌         | 360/6778 [03:57<1:10:03,  1.53it/s][A
Epoch 1:   5%|▌         | 361/6778 [03:57<1:10:03,  1.53it/s][A
Epoch 1:   5%|▌         | 362/6778 [03:58<1:09:58,  1.53it/s][A
Epoch 1:   5%|▌         | 363/6778 [03:59<1:09:58,  1.53it/s][A
Epoch 1:   5%|▌         | 364/6778 [03:59<1:09:57,  1.53it/s][A
Epoch 1:   5%|▌         | 365/6778 [04:00<1:09:57,  1.53it/s][A
Epoch 1:   5%|▌         | 366/6778 [04:01<1:10:15,  1.52it/s][A
Epoch 1:   5%|▌         


Epoch: 0, Loss0.319475893405013



Epoch 1:   6%|▌         | 402/6778 [04:24<1:09:37,  1.53it/s][A
Epoch 1:   6%|▌         | 403/6778 [04:25<1:09:42,  1.52it/s][A
Epoch 1:   6%|▌         | 404/6778 [04:26<1:09:37,  1.53it/s][A
Epoch 1:   6%|▌         | 405/6778 [04:26<1:10:09,  1.51it/s][A
Epoch 1:   6%|▌         | 406/6778 [04:27<1:09:29,  1.53it/s][A
Epoch 1:   6%|▌         | 407/6778 [04:28<1:09:32,  1.53it/s][A
Epoch 1:   6%|▌         | 408/6778 [04:28<1:09:36,  1.53it/s][A
Epoch 1:   6%|▌         | 409/6778 [04:29<1:09:28,  1.53it/s][A
Epoch 1:   6%|▌         | 410/6778 [04:29<1:09:27,  1.53it/s][A
Epoch 1:   6%|▌         | 411/6778 [04:30<1:09:21,  1.53it/s][A
Epoch 1:   6%|▌         | 412/6778 [04:31<1:09:47,  1.52it/s][A
Epoch 1:   6%|▌         | 413/6778 [04:31<1:09:43,  1.52it/s][A
Epoch 1:   6%|▌         | 414/6778 [04:32<1:10:02,  1.51it/s][A
Epoch 1:   6%|▌         | 415/6778 [04:33<1:10:09,  1.51it/s][A
Epoch 1:   6%|▌         | 416/6778 [04:33<1:11:12,  1.49it/s][A
Epoch 1:   6%|▌         


Epoch: 0, Loss0.3194871261352446



Epoch 1:   7%|▋         | 452/6778 [04:57<1:08:53,  1.53it/s][A
Epoch 1:   7%|▋         | 453/6778 [04:58<1:09:32,  1.52it/s][A
Epoch 1:   7%|▋         | 454/6778 [04:58<1:09:33,  1.52it/s][A
Epoch 1:   7%|▋         | 455/6778 [04:59<1:09:35,  1.51it/s][A
Epoch 1:   7%|▋         | 456/6778 [05:00<1:09:49,  1.51it/s][A
Epoch 1:   7%|▋         | 457/6778 [05:00<1:10:18,  1.50it/s][A
Epoch 1:   7%|▋         | 458/6778 [05:01<1:09:41,  1.51it/s][A
Epoch 1:   7%|▋         | 459/6778 [05:02<1:09:23,  1.52it/s][A
Epoch 1:   7%|▋         | 460/6778 [05:02<1:09:12,  1.52it/s][A
Epoch 1:   7%|▋         | 461/6778 [05:03<1:09:08,  1.52it/s][A
Epoch 1:   7%|▋         | 462/6778 [05:04<1:09:04,  1.52it/s][A
Epoch 1:   7%|▋         | 463/6778 [05:04<1:09:04,  1.52it/s][A
Epoch 1:   7%|▋         | 464/6778 [05:05<1:08:53,  1.53it/s][A
Epoch 1:   7%|▋         | 465/6778 [05:06<1:08:56,  1.53it/s][A
Epoch 1:   7%|▋         | 466/6778 [05:06<1:08:53,  1.53it/s][A
Epoch 1:   7%|▋         


Epoch: 0, Loss0.32016241651571203



Epoch 1:   7%|▋         | 502/6778 [05:30<1:08:41,  1.52it/s][A
Epoch 1:   7%|▋         | 503/6778 [05:31<1:08:41,  1.52it/s][A
Epoch 1:   7%|▋         | 504/6778 [05:31<1:09:02,  1.51it/s][A
Epoch 1:   7%|▋         | 505/6778 [05:32<1:08:27,  1.53it/s][A
Epoch 1:   7%|▋         | 506/6778 [05:33<1:08:33,  1.52it/s][A
Epoch 1:   7%|▋         | 507/6778 [05:33<1:08:24,  1.53it/s][A
Epoch 1:   7%|▋         | 508/6778 [05:34<1:08:31,  1.52it/s][A
Epoch 1:   8%|▊         | 509/6778 [05:35<1:08:25,  1.53it/s][A
Epoch 1:   8%|▊         | 510/6778 [05:35<1:08:21,  1.53it/s][A
Epoch 1:   8%|▊         | 511/6778 [05:36<1:08:17,  1.53it/s][A
Epoch 1:   8%|▊         | 512/6778 [05:36<1:08:23,  1.53it/s][A
Epoch 1:   8%|▊         | 513/6778 [05:37<1:08:13,  1.53it/s][A
Epoch 1:   8%|▊         | 514/6778 [05:38<1:08:30,  1.52it/s][A
Epoch 1:   8%|▊         | 515/6778 [05:38<1:08:42,  1.52it/s][A
Epoch 1:   8%|▊         | 516/6778 [05:39<1:08:52,  1.52it/s][A
Epoch 1:   8%|▊         


Epoch: 0, Loss0.3204045403079415



Epoch 1:   8%|▊         | 552/6778 [06:03<1:07:52,  1.53it/s][A
Epoch 1:   8%|▊         | 553/6778 [06:03<1:08:04,  1.52it/s][A
Epoch 1:   8%|▊         | 554/6778 [06:04<1:07:55,  1.53it/s][A
Epoch 1:   8%|▊         | 555/6778 [06:05<1:08:36,  1.51it/s][A
Epoch 1:   8%|▊         | 556/6778 [06:05<1:08:36,  1.51it/s][A
Epoch 1:   8%|▊         | 557/6778 [06:06<1:08:29,  1.51it/s][A
Epoch 1:   8%|▊         | 558/6778 [06:07<1:08:42,  1.51it/s][A
Epoch 1:   8%|▊         | 559/6778 [06:07<1:08:54,  1.50it/s][A
Epoch 1:   8%|▊         | 560/6778 [06:08<1:08:13,  1.52it/s][A
Epoch 1:   8%|▊         | 561/6778 [06:09<1:08:00,  1.52it/s][A
Epoch 1:   8%|▊         | 562/6778 [06:09<1:07:56,  1.52it/s][A
Epoch 1:   8%|▊         | 563/6778 [06:10<1:07:49,  1.53it/s][A
Epoch 1:   8%|▊         | 564/6778 [06:11<1:08:00,  1.52it/s][A
Epoch 1:   8%|▊         | 565/6778 [06:11<1:07:54,  1.52it/s][A
Epoch 1:   8%|▊         | 566/6778 [06:12<1:08:00,  1.52it/s][A
Epoch 1:   8%|▊         


Epoch: 0, Loss0.31953641997895105



Epoch 1:   9%|▉         | 602/6778 [06:36<1:07:57,  1.51it/s][A
Epoch 1:   9%|▉         | 603/6778 [06:36<1:07:51,  1.52it/s][A
Epoch 1:   9%|▉         | 604/6778 [06:37<1:07:43,  1.52it/s][A
Epoch 1:   9%|▉         | 605/6778 [06:38<1:07:29,  1.52it/s][A
Epoch 1:   9%|▉         | 606/6778 [06:38<1:07:22,  1.53it/s][A
Epoch 1:   9%|▉         | 607/6778 [06:39<1:07:19,  1.53it/s][A
Epoch 1:   9%|▉         | 608/6778 [06:40<1:07:23,  1.53it/s][A
Epoch 1:   9%|▉         | 609/6778 [06:40<1:07:16,  1.53it/s][A
Epoch 1:   9%|▉         | 610/6778 [06:41<1:07:14,  1.53it/s][A
Epoch 1:   9%|▉         | 611/6778 [06:42<1:07:13,  1.53it/s][A
Epoch 1:   9%|▉         | 612/6778 [06:42<1:07:06,  1.53it/s][A
Epoch 1:   9%|▉         | 613/6778 [06:43<1:07:10,  1.53it/s][A
Epoch 1:   9%|▉         | 614/6778 [06:43<1:07:05,  1.53it/s][A
Epoch 1:   9%|▉         | 615/6778 [06:44<1:07:05,  1.53it/s][A
Epoch 1:   9%|▉         | 616/6778 [06:45<1:07:35,  1.52it/s][A
Epoch 1:   9%|▉         


Epoch: 0, Loss0.31834280259689796



Epoch 1:  10%|▉         | 652/6778 [07:08<1:06:42,  1.53it/s][A
Epoch 1:  10%|▉         | 653/6778 [07:09<1:06:50,  1.53it/s][A
Epoch 1:  10%|▉         | 654/6778 [07:10<1:06:46,  1.53it/s][A
Epoch 1:  10%|▉         | 655/6778 [07:10<1:06:46,  1.53it/s][A
Epoch 1:  10%|▉         | 656/6778 [07:11<1:06:45,  1.53it/s][A
Epoch 1:  10%|▉         | 657/6778 [07:12<1:07:12,  1.52it/s][A
Epoch 1:  10%|▉         | 658/6778 [07:12<1:07:12,  1.52it/s][A
Epoch 1:  10%|▉         | 659/6778 [07:13<1:07:07,  1.52it/s][A
Epoch 1:  10%|▉         | 660/6778 [07:14<1:07:16,  1.52it/s][A
Epoch 1:  10%|▉         | 661/6778 [07:14<1:07:46,  1.50it/s][A
Epoch 1:  10%|▉         | 662/6778 [07:15<1:07:49,  1.50it/s][A
Epoch 1:  10%|▉         | 663/6778 [07:16<1:06:48,  1.53it/s][A
Epoch 1:  10%|▉         | 664/6778 [07:16<1:06:48,  1.53it/s][A
Epoch 1:  10%|▉         | 665/6778 [07:17<1:06:43,  1.53it/s][A
Epoch 1:  10%|▉         | 666/6778 [07:18<1:06:35,  1.53it/s][A
Epoch 1:  10%|▉         


Epoch: 0, Loss0.31850694753389047



Epoch 1:  10%|█         | 702/6778 [07:41<1:06:58,  1.51it/s][A
Epoch 1:  10%|█         | 703/6778 [07:42<1:07:04,  1.51it/s][A
Epoch 1:  10%|█         | 704/6778 [07:43<1:06:34,  1.52it/s][A
Epoch 1:  10%|█         | 705/6778 [07:43<1:06:30,  1.52it/s][A
Epoch 1:  10%|█         | 706/6778 [07:44<1:06:23,  1.52it/s][A
Epoch 1:  10%|█         | 707/6778 [07:45<1:06:26,  1.52it/s][A
Epoch 1:  10%|█         | 708/6778 [07:45<1:06:18,  1.53it/s][A
Epoch 1:  10%|█         | 709/6778 [07:46<1:06:13,  1.53it/s][A
Epoch 1:  10%|█         | 710/6778 [07:46<1:06:05,  1.53it/s][A
Epoch 1:  10%|█         | 711/6778 [07:47<1:06:06,  1.53it/s][A
Epoch 1:  11%|█         | 712/6778 [07:48<1:06:06,  1.53it/s][A
Epoch 1:  11%|█         | 713/6778 [07:48<1:06:18,  1.52it/s][A
Epoch 1:  11%|█         | 714/6778 [07:49<1:06:17,  1.52it/s][A
Epoch 1:  11%|█         | 715/6778 [07:50<1:06:12,  1.53it/s][A
Epoch 1:  11%|█         | 716/6778 [07:50<1:06:09,  1.53it/s][A
Epoch 1:  11%|█         


Epoch: 0, Loss0.31783745377343126



Epoch 1:  11%|█         | 752/6778 [08:14<1:05:33,  1.53it/s][A
Epoch 1:  11%|█         | 753/6778 [08:15<1:05:35,  1.53it/s][A
Epoch 1:  11%|█         | 754/6778 [08:15<1:05:34,  1.53it/s][A
Epoch 1:  11%|█         | 755/6778 [08:16<1:05:31,  1.53it/s][A
Epoch 1:  11%|█         | 756/6778 [08:17<1:05:33,  1.53it/s][A
Epoch 1:  11%|█         | 757/6778 [08:17<1:05:42,  1.53it/s][A
Epoch 1:  11%|█         | 758/6778 [08:18<1:05:35,  1.53it/s][A
Epoch 1:  11%|█         | 759/6778 [08:19<1:05:33,  1.53it/s][A
Epoch 1:  11%|█         | 760/6778 [08:19<1:06:06,  1.52it/s][A
Epoch 1:  11%|█         | 761/6778 [08:20<1:06:08,  1.52it/s][A
Epoch 1:  11%|█         | 762/6778 [08:21<1:06:11,  1.51it/s][A
Epoch 1:  11%|█▏        | 763/6778 [08:21<1:06:32,  1.51it/s][A
Epoch 1:  11%|█▏        | 764/6778 [08:22<1:06:26,  1.51it/s][A
Epoch 1:  11%|█▏        | 765/6778 [08:23<1:05:40,  1.53it/s][A
Epoch 1:  11%|█▏        | 766/6778 [08:23<1:05:36,  1.53it/s][A
Epoch 1:  11%|█▏        


Epoch: 0, Loss0.3168600583344363



Epoch 1:  12%|█▏        | 802/6778 [08:47<1:05:54,  1.51it/s][A
Epoch 1:  12%|█▏        | 803/6778 [08:48<1:05:37,  1.52it/s][A
Epoch 1:  12%|█▏        | 804/6778 [08:48<1:05:37,  1.52it/s][A
Epoch 1:  12%|█▏        | 805/6778 [08:49<1:05:32,  1.52it/s][A
Epoch 1:  12%|█▏        | 806/6778 [08:49<1:05:21,  1.52it/s][A
Epoch 1:  12%|█▏        | 807/6778 [08:50<1:05:12,  1.53it/s][A
Epoch 1:  12%|█▏        | 808/6778 [08:51<1:05:09,  1.53it/s][A
Epoch 1:  12%|█▏        | 809/6778 [08:51<1:05:03,  1.53it/s][A
Epoch 1:  12%|█▏        | 810/6778 [08:52<1:04:53,  1.53it/s][A
Epoch 1:  12%|█▏        | 811/6778 [08:53<1:05:14,  1.52it/s][A
Epoch 1:  12%|█▏        | 812/6778 [08:53<1:04:44,  1.54it/s][A
Epoch 1:  12%|█▏        | 813/6778 [08:54<1:04:51,  1.53it/s][A
Epoch 1:  12%|█▏        | 814/6778 [08:55<1:04:49,  1.53it/s][A
Epoch 1:  12%|█▏        | 815/6778 [08:55<1:04:49,  1.53it/s][A
Epoch 1:  12%|█▏        | 816/6778 [08:56<1:04:54,  1.53it/s][A
Epoch 1:  12%|█▏        


Epoch: 0, Loss0.31561834950844914



Epoch 1:  13%|█▎        | 852/6778 [09:20<1:04:30,  1.53it/s][A
Epoch 1:  13%|█▎        | 853/6778 [09:20<1:04:41,  1.53it/s][A
Epoch 1:  13%|█▎        | 854/6778 [09:21<1:04:38,  1.53it/s][A
Epoch 1:  13%|█▎        | 855/6778 [09:22<1:05:04,  1.52it/s][A
Epoch 1:  13%|█▎        | 856/6778 [09:22<1:04:21,  1.53it/s][A
Epoch 1:  13%|█▎        | 857/6778 [09:23<1:04:22,  1.53it/s][A
Epoch 1:  13%|█▎        | 858/6778 [09:24<1:04:31,  1.53it/s][A
Epoch 1:  13%|█▎        | 859/6778 [09:24<1:04:33,  1.53it/s][A
Epoch 1:  13%|█▎        | 860/6778 [09:25<1:04:29,  1.53it/s][A
Epoch 1:  13%|█▎        | 861/6778 [09:26<1:04:57,  1.52it/s][A
Epoch 1:  13%|█▎        | 862/6778 [09:26<1:04:39,  1.52it/s][A
Epoch 1:  13%|█▎        | 863/6778 [09:27<1:05:01,  1.52it/s][A
Epoch 1:  13%|█▎        | 864/6778 [09:28<1:05:05,  1.51it/s][A
Epoch 1:  13%|█▎        | 865/6778 [09:28<1:05:25,  1.51it/s][A
Epoch 1:  13%|█▎        | 866/6778 [09:29<1:05:14,  1.51it/s][A
Epoch 1:  13%|█▎        


Epoch: 0, Loss0.3146079644213506



Epoch 1:  13%|█▎        | 902/6778 [09:52<1:03:58,  1.53it/s][A
Epoch 1:  13%|█▎        | 903/6778 [09:53<1:04:20,  1.52it/s][A
Epoch 1:  13%|█▎        | 904/6778 [09:54<1:04:40,  1.51it/s][A
Epoch 1:  13%|█▎        | 905/6778 [09:54<1:04:21,  1.52it/s][A
Epoch 1:  13%|█▎        | 906/6778 [09:55<1:04:54,  1.51it/s][A
Epoch 1:  13%|█▎        | 907/6778 [09:56<1:04:45,  1.51it/s][A
Epoch 1:  13%|█▎        | 908/6778 [09:56<1:04:00,  1.53it/s][A
Epoch 1:  13%|█▎        | 909/6778 [09:57<1:04:03,  1.53it/s][A
Epoch 1:  13%|█▎        | 910/6778 [09:58<1:03:57,  1.53it/s][A
Epoch 1:  13%|█▎        | 911/6778 [09:58<1:03:53,  1.53it/s][A
Epoch 1:  13%|█▎        | 912/6778 [09:59<1:03:51,  1.53it/s][A
Epoch 1:  13%|█▎        | 913/6778 [10:00<1:03:57,  1.53it/s][A
Epoch 1:  13%|█▎        | 914/6778 [10:00<1:03:51,  1.53it/s][A
Epoch 1:  13%|█▎        | 915/6778 [10:01<1:04:05,  1.52it/s][A
Epoch 1:  14%|█▎        | 916/6778 [10:02<1:03:48,  1.53it/s][A
Epoch 1:  14%|█▎        


Epoch: 0, Loss0.3138672708368201



Epoch 1:  14%|█▍        | 952/6778 [10:25<1:03:32,  1.53it/s][A
Epoch 1:  14%|█▍        | 953/6778 [10:26<1:03:25,  1.53it/s][A
Epoch 1:  14%|█▍        | 954/6778 [10:27<1:03:22,  1.53it/s][A
Epoch 1:  14%|█▍        | 955/6778 [10:27<1:03:32,  1.53it/s][A
Epoch 1:  14%|█▍        | 956/6778 [10:28<1:03:16,  1.53it/s][A
Epoch 1:  14%|█▍        | 957/6778 [10:28<1:03:05,  1.54it/s][A
Epoch 1:  14%|█▍        | 958/6778 [10:29<1:03:06,  1.54it/s][A
Epoch 1:  14%|█▍        | 959/6778 [10:30<1:03:11,  1.53it/s][A
Epoch 1:  14%|█▍        | 960/6778 [10:30<1:03:21,  1.53it/s][A
Epoch 1:  14%|█▍        | 961/6778 [10:31<1:03:17,  1.53it/s][A
Epoch 1:  14%|█▍        | 962/6778 [10:32<1:03:14,  1.53it/s][A
Epoch 1:  14%|█▍        | 963/6778 [10:32<1:03:27,  1.53it/s][A
Epoch 1:  14%|█▍        | 964/6778 [10:33<1:04:09,  1.51it/s][A
Epoch 1:  14%|█▍        | 965/6778 [10:34<1:03:58,  1.51it/s][A
Epoch 1:  14%|█▍        | 966/6778 [10:34<1:03:48,  1.52it/s][A
Epoch 1:  14%|█▍        


Epoch: 0, Loss0.3134012095458977



Epoch 1:  15%|█▍        | 1002/6778 [10:58<1:03:05,  1.53it/s][A
Epoch 1:  15%|█▍        | 1003/6778 [10:59<1:02:54,  1.53it/s][A
Epoch 1:  15%|█▍        | 1004/6778 [10:59<1:03:05,  1.53it/s][A
Epoch 1:  15%|█▍        | 1005/6778 [11:00<1:03:38,  1.51it/s][A
Epoch 1:  15%|█▍        | 1006/6778 [11:01<1:03:30,  1.51it/s][A
Epoch 1:  15%|█▍        | 1007/6778 [11:01<1:03:25,  1.52it/s][A
Epoch 1:  15%|█▍        | 1008/6778 [11:02<1:03:37,  1.51it/s][A
Epoch 1:  15%|█▍        | 1009/6778 [11:03<1:03:51,  1.51it/s][A
Epoch 1:  15%|█▍        | 1010/6778 [11:03<1:03:40,  1.51it/s][A
Epoch 1:  15%|█▍        | 1011/6778 [11:04<1:03:26,  1.52it/s][A
Epoch 1:  15%|█▍        | 1012/6778 [11:05<1:03:08,  1.52it/s][A
Epoch 1:  15%|█▍        | 1013/6778 [11:05<1:03:06,  1.52it/s][A
Epoch 1:  15%|█▍        | 1014/6778 [11:06<1:02:55,  1.53it/s][A
Epoch 1:  15%|█▍        | 1015/6778 [11:07<1:02:56,  1.53it/s][A
Epoch 1:  15%|█▍        | 1016/6778 [11:07<1:02:52,  1.53it/s][A
Epoch 1: 


Epoch: 0, Loss0.3139553092753286



Epoch 1:  16%|█▌        | 1052/6778 [11:31<1:02:31,  1.53it/s][A
Epoch 1:  16%|█▌        | 1053/6778 [11:32<1:02:33,  1.53it/s][A
Epoch 1:  16%|█▌        | 1054/6778 [11:32<1:02:34,  1.52it/s][A
Epoch 1:  16%|█▌        | 1055/6778 [11:33<1:02:31,  1.53it/s][A
Epoch 1:  16%|█▌        | 1056/6778 [11:33<1:02:21,  1.53it/s][A
Epoch 1:  16%|█▌        | 1057/6778 [11:34<1:02:12,  1.53it/s][A
Epoch 1:  16%|█▌        | 1058/6778 [11:35<1:02:07,  1.53it/s][A
Epoch 1:  16%|█▌        | 1059/6778 [11:35<1:02:10,  1.53it/s][A
Epoch 1:  16%|█▌        | 1060/6778 [11:36<1:02:04,  1.54it/s][A
Epoch 1:  16%|█▌        | 1061/6778 [11:37<1:02:18,  1.53it/s][A
Epoch 1:  16%|█▌        | 1062/6778 [11:37<1:02:11,  1.53it/s][A
Epoch 1:  16%|█▌        | 1063/6778 [11:38<1:02:15,  1.53it/s][A
Epoch 1:  16%|█▌        | 1064/6778 [11:39<1:02:04,  1.53it/s][A
Epoch 1:  16%|█▌        | 1065/6778 [11:39<1:02:11,  1.53it/s][A
Epoch 1:  16%|█▌        | 1066/6778 [11:40<1:02:11,  1.53it/s][A
Epoch 1: 


Epoch: 0, Loss0.31343030022773605



Epoch 1:  16%|█▋        | 1102/6778 [12:04<1:02:03,  1.52it/s][A
Epoch 1:  16%|█▋        | 1103/6778 [12:04<1:01:55,  1.53it/s][A
Epoch 1:  16%|█▋        | 1104/6778 [12:05<1:01:57,  1.53it/s][A
Epoch 1:  16%|█▋        | 1105/6778 [12:06<1:01:57,  1.53it/s][A
Epoch 1:  16%|█▋        | 1106/6778 [12:06<1:01:49,  1.53it/s][A
Epoch 1:  16%|█▋        | 1107/6778 [12:07<1:01:41,  1.53it/s][A
Epoch 1:  16%|█▋        | 1108/6778 [12:08<1:02:25,  1.51it/s][A
Epoch 1:  16%|█▋        | 1109/6778 [12:08<1:02:26,  1.51it/s][A
Epoch 1:  16%|█▋        | 1110/6778 [12:09<1:02:45,  1.51it/s][A
Epoch 1:  16%|█▋        | 1111/6778 [12:10<1:02:47,  1.50it/s][A
Epoch 1:  16%|█▋        | 1112/6778 [12:10<1:02:58,  1.50it/s][A
Epoch 1:  16%|█▋        | 1113/6778 [12:11<1:02:07,  1.52it/s][A
Epoch 1:  16%|█▋        | 1114/6778 [12:12<1:02:13,  1.52it/s][A
Epoch 1:  16%|█▋        | 1115/6778 [12:12<1:02:08,  1.52it/s][A
Epoch 1:  16%|█▋        | 1116/6778 [12:13<1:01:56,  1.52it/s][A
Epoch 1: 


Epoch: 0, Loss0.31283611217133384



Epoch 1:  17%|█▋        | 1152/6778 [12:37<1:02:26,  1.50it/s][A
Epoch 1:  17%|█▋        | 1153/6778 [12:37<1:02:19,  1.50it/s][A
Epoch 1:  17%|█▋        | 1154/6778 [12:38<1:01:38,  1.52it/s][A
Epoch 1:  17%|█▋        | 1155/6778 [12:39<1:01:33,  1.52it/s][A
Epoch 1:  17%|█▋        | 1156/6778 [12:39<1:01:32,  1.52it/s][A
Epoch 1:  17%|█▋        | 1157/6778 [12:40<1:01:29,  1.52it/s][A
Epoch 1:  17%|█▋        | 1158/6778 [12:41<1:01:29,  1.52it/s][A
Epoch 1:  17%|█▋        | 1159/6778 [12:41<1:01:31,  1.52it/s][A
Epoch 1:  17%|█▋        | 1160/6778 [12:42<1:01:31,  1.52it/s][A
Epoch 1:  17%|█▋        | 1161/6778 [12:43<1:01:28,  1.52it/s][A
Epoch 1:  17%|█▋        | 1162/6778 [12:43<1:01:21,  1.53it/s][A
Epoch 1:  17%|█▋        | 1163/6778 [12:44<1:01:34,  1.52it/s][A
Epoch 1:  17%|█▋        | 1164/6778 [12:44<1:01:27,  1.52it/s][A
Epoch 1:  17%|█▋        | 1165/6778 [12:45<1:01:35,  1.52it/s][A
Epoch 1:  17%|█▋        | 1166/6778 [12:46<1:01:24,  1.52it/s][A
Epoch 1: 


Epoch: 0, Loss0.31263060048904945



Epoch 1:  18%|█▊        | 1202/6778 [13:10<1:00:58,  1.52it/s][A
Epoch 1:  18%|█▊        | 1203/6778 [13:10<1:01:06,  1.52it/s][A
Epoch 1:  18%|█▊        | 1204/6778 [13:11<1:00:56,  1.52it/s][A
Epoch 1:  18%|█▊        | 1205/6778 [13:12<1:00:54,  1.53it/s][A
Epoch 1:  18%|█▊        | 1206/6778 [13:12<1:00:57,  1.52it/s][A
Epoch 1:  18%|█▊        | 1207/6778 [13:13<1:00:56,  1.52it/s][A
Epoch 1:  18%|█▊        | 1208/6778 [13:13<1:00:56,  1.52it/s][A
Epoch 1:  18%|█▊        | 1209/6778 [13:14<1:00:44,  1.53it/s][A
Epoch 1:  18%|█▊        | 1210/6778 [13:15<1:01:20,  1.51it/s][A
Epoch 1:  18%|█▊        | 1211/6778 [13:15<1:01:26,  1.51it/s][A
Epoch 1:  18%|█▊        | 1212/6778 [13:16<1:01:34,  1.51it/s][A
Epoch 1:  18%|█▊        | 1213/6778 [13:17<1:01:23,  1.51it/s][A
Epoch 1:  18%|█▊        | 1214/6778 [13:17<1:01:42,  1.50it/s][A
Epoch 1:  18%|█▊        | 1215/6778 [13:18<1:00:51,  1.52it/s][A
Epoch 1:  18%|█▊        | 1216/6778 [13:19<1:00:40,  1.53it/s][A
Epoch 1: 


Epoch: 0, Loss0.31305277329697595



Epoch 1:  18%|█▊        | 1252/6778 [13:42<1:00:48,  1.51it/s][A
Epoch 1:  18%|█▊        | 1253/6778 [13:43<1:01:04,  1.51it/s][A
Epoch 1:  19%|█▊        | 1254/6778 [13:44<1:01:12,  1.50it/s][A
Epoch 1:  19%|█▊        | 1255/6778 [13:44<1:01:19,  1.50it/s][A
Epoch 1:  19%|█▊        | 1256/6778 [13:45<1:00:44,  1.52it/s][A
Epoch 1:  19%|█▊        | 1257/6778 [13:46<1:00:28,  1.52it/s][A
Epoch 1:  19%|█▊        | 1258/6778 [13:46<1:00:17,  1.53it/s][A
Epoch 1:  19%|█▊        | 1259/6778 [13:47<1:00:19,  1.52it/s][A
Epoch 1:  19%|█▊        | 1260/6778 [13:48<1:00:23,  1.52it/s][A
Epoch 1:  19%|█▊        | 1261/6778 [13:48<1:00:10,  1.53it/s][A
Epoch 1:  19%|█▊        | 1262/6778 [13:49<1:00:05,  1.53it/s][A
Epoch 1:  19%|█▊        | 1263/6778 [13:50<1:00:06,  1.53it/s][A
Epoch 1:  19%|█▊        | 1264/6778 [13:50<1:00:01,  1.53it/s][A
Epoch 1:  19%|█▊        | 1265/6778 [13:51<1:00:09,  1.53it/s][A
Epoch 1:  19%|█▊        | 1266/6778 [13:52<1:00:07,  1.53it/s][A
Epoch 1: 


Epoch: 0, Loss0.3120468462617648



Epoch 1:  19%|█▉        | 1302/6778 [14:15<59:35,  1.53it/s][A
Epoch 1:  19%|█▉        | 1303/6778 [14:16<59:42,  1.53it/s][A
Epoch 1:  19%|█▉        | 1304/6778 [14:17<1:00:01,  1.52it/s][A
Epoch 1:  19%|█▉        | 1305/6778 [14:17<1:00:01,  1.52it/s][A
Epoch 1:  19%|█▉        | 1306/6778 [14:18<59:51,  1.52it/s]  [A
Epoch 1:  19%|█▉        | 1307/6778 [14:19<59:46,  1.53it/s][A
Epoch 1:  19%|█▉        | 1308/6778 [14:19<59:41,  1.53it/s][A
Epoch 1:  19%|█▉        | 1309/6778 [14:20<59:47,  1.52it/s][A
Epoch 1:  19%|█▉        | 1310/6778 [14:20<59:43,  1.53it/s][A
Epoch 1:  19%|█▉        | 1311/6778 [14:21<59:44,  1.53it/s][A
Epoch 1:  19%|█▉        | 1312/6778 [14:22<1:00:15,  1.51it/s][A
Epoch 1:  19%|█▉        | 1313/6778 [14:22<1:00:20,  1.51it/s][A
Epoch 1:  19%|█▉        | 1314/6778 [14:23<1:00:02,  1.52it/s][A
Epoch 1:  19%|█▉        | 1315/6778 [14:24<1:00:02,  1.52it/s][A
Epoch 1:  19%|█▉        | 1316/6778 [14:24<1:00:08,  1.51it/s][A
Epoch 1:  19%|█▉       


Epoch: 0, Loss0.3123251149316438



Epoch 1:  20%|█▉        | 1352/6778 [14:48<59:08,  1.53it/s][A
Epoch 1:  20%|█▉        | 1353/6778 [14:49<59:40,  1.52it/s][A
Epoch 1:  20%|█▉        | 1354/6778 [14:49<59:42,  1.51it/s][A
Epoch 1:  20%|█▉        | 1355/6778 [14:50<1:00:04,  1.50it/s][A
Epoch 1:  20%|██        | 1356/6778 [14:51<59:53,  1.51it/s]  [A
Epoch 1:  20%|██        | 1357/6778 [14:51<1:00:21,  1.50it/s][A
Epoch 1:  20%|██        | 1358/6778 [14:52<59:40,  1.51it/s]  [A
Epoch 1:  20%|██        | 1359/6778 [14:53<59:53,  1.51it/s][A
Epoch 1:  20%|██        | 1360/6778 [14:53<59:37,  1.51it/s][A
Epoch 1:  20%|██        | 1361/6778 [14:54<59:34,  1.52it/s][A
Epoch 1:  20%|██        | 1362/6778 [14:55<59:27,  1.52it/s][A
Epoch 1:  20%|██        | 1363/6778 [14:55<59:17,  1.52it/s][A
Epoch 1:  20%|██        | 1364/6778 [14:56<59:06,  1.53it/s][A
Epoch 1:  20%|██        | 1365/6778 [14:57<59:07,  1.53it/s][A
Epoch 1:  20%|██        | 1366/6778 [14:57<59:00,  1.53it/s][A
Epoch 1:  20%|██        | 1367/


Epoch: 0, Loss0.31268385305819896



Epoch 1:  21%|██        | 1402/6778 [15:21<58:55,  1.52it/s][A
Epoch 1:  21%|██        | 1403/6778 [15:22<59:06,  1.52it/s][A
Epoch 1:  21%|██        | 1404/6778 [15:22<58:52,  1.52it/s][A
Epoch 1:  21%|██        | 1405/6778 [15:23<58:54,  1.52it/s][A
Epoch 1:  21%|██        | 1406/6778 [15:24<58:51,  1.52it/s][A
Epoch 1:  21%|██        | 1407/6778 [15:24<58:42,  1.52it/s][A
Epoch 1:  21%|██        | 1408/6778 [15:25<58:38,  1.53it/s][A
Epoch 1:  21%|██        | 1409/6778 [15:26<58:32,  1.53it/s][A
Epoch 1:  21%|██        | 1410/6778 [15:26<58:37,  1.53it/s][A
Epoch 1:  21%|██        | 1411/6778 [15:27<58:31,  1.53it/s][A
Epoch 1:  21%|██        | 1412/6778 [15:28<58:40,  1.52it/s][A
Epoch 1:  21%|██        | 1413/6778 [15:28<58:23,  1.53it/s][A
Epoch 1:  21%|██        | 1414/6778 [15:29<58:26,  1.53it/s][A
Epoch 1:  21%|██        | 1415/6778 [15:29<58:50,  1.52it/s][A
Epoch 1:  21%|██        | 1416/6778 [15:30<59:00,  1.51it/s][A
Epoch 1:  21%|██        | 1417/6778 [15


Epoch: 0, Loss0.31229650438201584



Epoch 1:  21%|██▏       | 1452/6778 [15:54<58:08,  1.53it/s][A
Epoch 1:  21%|██▏       | 1453/6778 [15:54<58:08,  1.53it/s][A
Epoch 1:  21%|██▏       | 1454/6778 [15:55<58:06,  1.53it/s][A
Epoch 1:  21%|██▏       | 1455/6778 [15:56<58:30,  1.52it/s][A
Epoch 1:  21%|██▏       | 1456/6778 [15:56<58:36,  1.51it/s][A
Epoch 1:  21%|██▏       | 1457/6778 [15:57<58:32,  1.52it/s][A
Epoch 1:  22%|██▏       | 1458/6778 [15:58<58:42,  1.51it/s][A
Epoch 1:  22%|██▏       | 1459/6778 [15:58<58:57,  1.50it/s][A
Epoch 1:  22%|██▏       | 1460/6778 [15:59<58:53,  1.50it/s][A
Epoch 1:  22%|██▏       | 1461/6778 [16:00<58:10,  1.52it/s][A
Epoch 1:  22%|██▏       | 1462/6778 [16:00<58:05,  1.53it/s][A
Epoch 1:  22%|██▏       | 1463/6778 [16:01<58:12,  1.52it/s][A
Epoch 1:  22%|██▏       | 1464/6778 [16:02<58:05,  1.52it/s][A
Epoch 1:  22%|██▏       | 1465/6778 [16:02<57:47,  1.53it/s][A
Epoch 1:  22%|██▏       | 1466/6778 [16:03<57:54,  1.53it/s][A
Epoch 1:  22%|██▏       | 1467/6778 [16


Epoch: 0, Loss0.31186170162239685



Epoch 1:  22%|██▏       | 1502/6778 [16:27<58:00,  1.52it/s][A
Epoch 1:  22%|██▏       | 1503/6778 [16:27<57:47,  1.52it/s][A
Epoch 1:  22%|██▏       | 1504/6778 [16:28<57:54,  1.52it/s][A
Epoch 1:  22%|██▏       | 1505/6778 [16:29<57:49,  1.52it/s][A
Epoch 1:  22%|██▏       | 1506/6778 [16:29<57:45,  1.52it/s][A
Epoch 1:  22%|██▏       | 1507/6778 [16:30<57:39,  1.52it/s][A
Epoch 1:  22%|██▏       | 1508/6778 [16:31<57:30,  1.53it/s][A
Epoch 1:  22%|██▏       | 1509/6778 [16:31<57:22,  1.53it/s][A
Epoch 1:  22%|██▏       | 1510/6778 [16:32<57:25,  1.53it/s][A
Epoch 1:  22%|██▏       | 1511/6778 [16:33<57:21,  1.53it/s][A
Epoch 1:  22%|██▏       | 1512/6778 [16:33<57:17,  1.53it/s][A
Epoch 1:  22%|██▏       | 1513/6778 [16:34<57:21,  1.53it/s][A
Epoch 1:  22%|██▏       | 1514/6778 [16:35<57:17,  1.53it/s][A
Epoch 1:  22%|██▏       | 1515/6778 [16:35<57:26,  1.53it/s][A
Epoch 1:  22%|██▏       | 1516/6778 [16:36<57:27,  1.53it/s][A
Epoch 1:  22%|██▏       | 1517/6778 [16


Epoch: 0, Loss0.3115647828901759



Epoch 1:  23%|██▎       | 1552/6778 [16:59<56:58,  1.53it/s][A
Epoch 1:  23%|██▎       | 1553/6778 [17:00<56:54,  1.53it/s][A
Epoch 1:  23%|██▎       | 1554/6778 [17:01<56:49,  1.53it/s][A
Epoch 1:  23%|██▎       | 1555/6778 [17:01<57:01,  1.53it/s][A
Epoch 1:  23%|██▎       | 1556/6778 [17:02<56:58,  1.53it/s][A
Epoch 1:  23%|██▎       | 1557/6778 [17:03<57:00,  1.53it/s][A
Epoch 1:  23%|██▎       | 1558/6778 [17:03<57:20,  1.52it/s][A
Epoch 1:  23%|██▎       | 1559/6778 [17:04<57:09,  1.52it/s][A
Epoch 1:  23%|██▎       | 1560/6778 [17:05<57:09,  1.52it/s][A
Epoch 1:  23%|██▎       | 1561/6778 [17:05<57:34,  1.51it/s][A
Epoch 1:  23%|██▎       | 1562/6778 [17:06<57:39,  1.51it/s][A
Epoch 1:  23%|██▎       | 1563/6778 [17:07<57:16,  1.52it/s][A
Epoch 1:  23%|██▎       | 1564/6778 [17:07<57:04,  1.52it/s][A
Epoch 1:  23%|██▎       | 1565/6778 [17:08<57:09,  1.52it/s][A
Epoch 1:  23%|██▎       | 1566/6778 [17:09<57:13,  1.52it/s][A
Epoch 1:  23%|██▎       | 1567/6778 [17


Epoch: 0, Loss0.3110983843806384



Epoch 1:  24%|██▎       | 1602/6778 [17:32<57:25,  1.50it/s][A
Epoch 1:  24%|██▎       | 1603/6778 [17:33<57:24,  1.50it/s][A
Epoch 1:  24%|██▎       | 1604/6778 [17:34<56:49,  1.52it/s][A
Epoch 1:  24%|██▎       | 1605/6778 [17:34<56:50,  1.52it/s][A
Epoch 1:  24%|██▎       | 1606/6778 [17:35<56:30,  1.53it/s][A
Epoch 1:  24%|██▎       | 1607/6778 [17:36<56:26,  1.53it/s][A
Epoch 1:  24%|██▎       | 1608/6778 [17:36<56:29,  1.53it/s][A
Epoch 1:  24%|██▎       | 1609/6778 [17:37<56:20,  1.53it/s][A
Epoch 1:  24%|██▍       | 1610/6778 [17:38<56:18,  1.53it/s][A
Epoch 1:  24%|██▍       | 1611/6778 [17:38<56:25,  1.53it/s][A
Epoch 1:  24%|██▍       | 1612/6778 [17:39<56:22,  1.53it/s][A
Epoch 1:  24%|██▍       | 1613/6778 [17:40<56:16,  1.53it/s][A
Epoch 1:  24%|██▍       | 1614/6778 [17:40<56:22,  1.53it/s][A
Epoch 1:  24%|██▍       | 1615/6778 [17:41<56:21,  1.53it/s][A
Epoch 1:  24%|██▍       | 1616/6778 [17:42<56:16,  1.53it/s][A
Epoch 1:  24%|██▍       | 1617/6778 [17


Epoch: 0, Loss0.3108156582646338



Epoch 1:  24%|██▍       | 1652/6778 [18:05<56:02,  1.52it/s][A
Epoch 1:  24%|██▍       | 1653/6778 [18:06<56:05,  1.52it/s][A
Epoch 1:  24%|██▍       | 1654/6778 [18:06<55:56,  1.53it/s][A
Epoch 1:  24%|██▍       | 1655/6778 [18:07<55:48,  1.53it/s][A
Epoch 1:  24%|██▍       | 1656/6778 [18:08<56:00,  1.52it/s][A
Epoch 1:  24%|██▍       | 1657/6778 [18:08<55:51,  1.53it/s][A
Epoch 1:  24%|██▍       | 1658/6778 [18:09<55:55,  1.53it/s][A
Epoch 1:  24%|██▍       | 1659/6778 [18:10<55:51,  1.53it/s][A
Epoch 1:  24%|██▍       | 1660/6778 [18:10<56:34,  1.51it/s][A
Epoch 1:  25%|██▍       | 1661/6778 [18:11<56:31,  1.51it/s][A
Epoch 1:  25%|██▍       | 1662/6778 [18:12<56:38,  1.51it/s][A
Epoch 1:  25%|██▍       | 1663/6778 [18:12<56:31,  1.51it/s][A
Epoch 1:  25%|██▍       | 1664/6778 [18:13<56:52,  1.50it/s][A
Epoch 1:  25%|██▍       | 1665/6778 [18:14<56:25,  1.51it/s][A
Epoch 1:  25%|██▍       | 1666/6778 [18:14<56:10,  1.52it/s][A
Epoch 1:  25%|██▍       | 1667/6778 [18


Epoch: 0, Loss0.31056019616505454



Epoch 1:  25%|██▌       | 1702/6778 [18:38<55:47,  1.52it/s][A
Epoch 1:  25%|██▌       | 1703/6778 [18:39<56:04,  1.51it/s][A
Epoch 1:  25%|██▌       | 1704/6778 [18:39<56:12,  1.50it/s][A
Epoch 1:  25%|██▌       | 1705/6778 [18:40<56:07,  1.51it/s][A
Epoch 1:  25%|██▌       | 1706/6778 [18:41<55:40,  1.52it/s][A
Epoch 1:  25%|██▌       | 1707/6778 [18:41<55:29,  1.52it/s][A
Epoch 1:  25%|██▌       | 1708/6778 [18:42<55:33,  1.52it/s][A
Epoch 1:  25%|██▌       | 1709/6778 [18:43<55:23,  1.53it/s][A
Epoch 1:  25%|██▌       | 1710/6778 [18:43<55:25,  1.52it/s][A
Epoch 1:  25%|██▌       | 1711/6778 [18:44<55:26,  1.52it/s][A
Epoch 1:  25%|██▌       | 1712/6778 [18:45<55:21,  1.53it/s][A
Epoch 1:  25%|██▌       | 1713/6778 [18:45<55:12,  1.53it/s][A
Epoch 1:  25%|██▌       | 1714/6778 [18:46<55:10,  1.53it/s][A
Epoch 1:  25%|██▌       | 1715/6778 [18:47<55:06,  1.53it/s][A
Epoch 1:  25%|██▌       | 1716/6778 [18:47<55:05,  1.53it/s][A
Epoch 1:  25%|██▌       | 1717/6778 [18


Epoch: 0, Loss0.31030063686848774



Epoch 1:  26%|██▌       | 1752/6778 [19:11<55:11,  1.52it/s][A
Epoch 1:  26%|██▌       | 1753/6778 [19:12<55:03,  1.52it/s][A
Epoch 1:  26%|██▌       | 1754/6778 [19:12<54:51,  1.53it/s][A
Epoch 1:  26%|██▌       | 1755/6778 [19:13<54:50,  1.53it/s][A
Epoch 1:  26%|██▌       | 1756/6778 [19:14<54:47,  1.53it/s][A
Epoch 1:  26%|██▌       | 1757/6778 [19:14<54:40,  1.53it/s][A
Epoch 1:  26%|██▌       | 1758/6778 [19:15<54:45,  1.53it/s][A
Epoch 1:  26%|██▌       | 1759/6778 [19:16<54:50,  1.53it/s][A
Epoch 1:  26%|██▌       | 1760/6778 [19:16<54:32,  1.53it/s][A
Epoch 1:  26%|██▌       | 1761/6778 [19:17<54:36,  1.53it/s][A
Epoch 1:  26%|██▌       | 1762/6778 [19:17<55:00,  1.52it/s][A
Epoch 1:  26%|██▌       | 1763/6778 [19:18<54:55,  1.52it/s][A
Epoch 1:  26%|██▌       | 1764/6778 [19:19<55:14,  1.51it/s][A
Epoch 1:  26%|██▌       | 1765/6778 [19:19<55:13,  1.51it/s][A
Epoch 1:  26%|██▌       | 1766/6778 [19:20<55:30,  1.51it/s][A
Epoch 1:  26%|██▌       | 1767/6778 [19


Epoch: 0, Loss0.30989915708794585



Epoch 1:  27%|██▋       | 1802/6778 [19:44<54:08,  1.53it/s][A
Epoch 1:  27%|██▋       | 1803/6778 [19:44<54:26,  1.52it/s][A
Epoch 1:  27%|██▋       | 1804/6778 [19:45<54:15,  1.53it/s][A
Epoch 1:  27%|██▋       | 1805/6778 [19:46<54:26,  1.52it/s][A
Epoch 1:  27%|██▋       | 1806/6778 [19:46<54:29,  1.52it/s][A
Epoch 1:  27%|██▋       | 1807/6778 [19:47<54:51,  1.51it/s][A
Epoch 1:  27%|██▋       | 1808/6778 [19:48<54:54,  1.51it/s][A
Epoch 1:  27%|██▋       | 1809/6778 [19:48<54:11,  1.53it/s][A
Epoch 1:  27%|██▋       | 1810/6778 [19:49<54:31,  1.52it/s][A
Epoch 1:  27%|██▋       | 1811/6778 [19:50<54:08,  1.53it/s][A
Epoch 1:  27%|██▋       | 1812/6778 [19:50<54:11,  1.53it/s][A
Epoch 1:  27%|██▋       | 1813/6778 [19:51<54:09,  1.53it/s][A
Epoch 1:  27%|██▋       | 1814/6778 [19:52<54:14,  1.53it/s][A
Epoch 1:  27%|██▋       | 1815/6778 [19:52<54:08,  1.53it/s][A
Epoch 1:  27%|██▋       | 1816/6778 [19:53<54:05,  1.53it/s][A
Epoch 1:  27%|██▋       | 1817/6778 [19


Epoch: 0, Loss0.30958999052184905



Epoch 1:  27%|██▋       | 1852/6778 [20:17<53:44,  1.53it/s][A
Epoch 1:  27%|██▋       | 1853/6778 [20:17<53:45,  1.53it/s][A
Epoch 1:  27%|██▋       | 1854/6778 [20:18<53:47,  1.53it/s][A
Epoch 1:  27%|██▋       | 1855/6778 [20:18<53:45,  1.53it/s][A
Epoch 1:  27%|██▋       | 1856/6778 [20:19<53:46,  1.53it/s][A
Epoch 1:  27%|██▋       | 1857/6778 [20:20<53:50,  1.52it/s][A
Epoch 1:  27%|██▋       | 1858/6778 [20:20<53:44,  1.53it/s][A
Epoch 1:  27%|██▋       | 1859/6778 [20:21<53:36,  1.53it/s][A
Epoch 1:  27%|██▋       | 1860/6778 [20:22<53:37,  1.53it/s][A
Epoch 1:  27%|██▋       | 1861/6778 [20:22<53:44,  1.53it/s][A
Epoch 1:  27%|██▋       | 1862/6778 [20:23<53:40,  1.53it/s][A
Epoch 1:  27%|██▋       | 1863/6778 [20:24<53:37,  1.53it/s][A
Epoch 1:  28%|██▊       | 1864/6778 [20:24<53:39,  1.53it/s][A
Epoch 1:  28%|██▊       | 1865/6778 [20:25<54:15,  1.51it/s][A
Epoch 1:  28%|██▊       | 1866/6778 [20:26<53:52,  1.52it/s][A
Epoch 1:  28%|██▊       | 1867/6778 [20


Epoch: 0, Loss0.3095998609029952



Epoch 1:  28%|██▊       | 1902/6778 [20:49<53:04,  1.53it/s][A
Epoch 1:  28%|██▊       | 1903/6778 [20:50<53:07,  1.53it/s][A
Epoch 1:  28%|██▊       | 1904/6778 [20:51<53:05,  1.53it/s][A
Epoch 1:  28%|██▊       | 1905/6778 [20:51<53:09,  1.53it/s][A
Epoch 1:  28%|██▊       | 1906/6778 [20:52<53:30,  1.52it/s][A
Epoch 1:  28%|██▊       | 1907/6778 [20:53<53:26,  1.52it/s][A
Epoch 1:  28%|██▊       | 1908/6778 [20:53<53:42,  1.51it/s][A
Epoch 1:  28%|██▊       | 1909/6778 [20:54<53:49,  1.51it/s][A
Epoch 1:  28%|██▊       | 1910/6778 [20:55<53:54,  1.50it/s][A
Epoch 1:  28%|██▊       | 1911/6778 [20:55<53:17,  1.52it/s][A
Epoch 1:  28%|██▊       | 1912/6778 [20:56<53:32,  1.51it/s][A
Epoch 1:  28%|██▊       | 1913/6778 [20:57<53:05,  1.53it/s][A
Epoch 1:  28%|██▊       | 1914/6778 [20:57<53:05,  1.53it/s][A
Epoch 1:  28%|██▊       | 1915/6778 [20:58<53:00,  1.53it/s][A
Epoch 1:  28%|██▊       | 1916/6778 [20:59<52:53,  1.53it/s][A
Epoch 1:  28%|██▊       | 1917/6778 [20


Epoch: 0, Loss0.3090506783399687



Epoch 1:  29%|██▉       | 1952/6778 [21:22<53:04,  1.52it/s][A
Epoch 1:  29%|██▉       | 1953/6778 [21:23<52:56,  1.52it/s][A
Epoch 1:  29%|██▉       | 1954/6778 [21:24<52:54,  1.52it/s][A
Epoch 1:  29%|██▉       | 1955/6778 [21:24<52:45,  1.52it/s][A
Epoch 1:  29%|██▉       | 1956/6778 [21:25<52:53,  1.52it/s][A
Epoch 1:  29%|██▉       | 1957/6778 [21:25<52:26,  1.53it/s][A
Epoch 1:  29%|██▉       | 1958/6778 [21:26<52:25,  1.53it/s][A
Epoch 1:  29%|██▉       | 1959/6778 [21:27<52:33,  1.53it/s][A
Epoch 1:  29%|██▉       | 1960/6778 [21:27<52:32,  1.53it/s][A
Epoch 1:  29%|██▉       | 1961/6778 [21:28<52:30,  1.53it/s][A
Epoch 1:  29%|██▉       | 1962/6778 [21:29<52:31,  1.53it/s][A
Epoch 1:  29%|██▉       | 1963/6778 [21:29<52:25,  1.53it/s][A
Epoch 1:  29%|██▉       | 1964/6778 [21:30<52:28,  1.53it/s][A
Epoch 1:  29%|██▉       | 1965/6778 [21:31<52:28,  1.53it/s][A
Epoch 1:  29%|██▉       | 1966/6778 [21:31<52:26,  1.53it/s][A
Epoch 1:  29%|██▉       | 1967/6778 [21


Epoch: 0, Loss0.3094622467284736



Epoch 1:  30%|██▉       | 2002/6778 [21:55<52:17,  1.52it/s][A
Epoch 1:  30%|██▉       | 2003/6778 [21:56<52:06,  1.53it/s][A
Epoch 1:  30%|██▉       | 2004/6778 [21:56<52:07,  1.53it/s][A
Epoch 1:  30%|██▉       | 2005/6778 [21:57<52:16,  1.52it/s][A
Epoch 1:  30%|██▉       | 2006/6778 [21:58<52:15,  1.52it/s][A
Epoch 1:  30%|██▉       | 2007/6778 [21:58<52:06,  1.53it/s][A
Epoch 1:  30%|██▉       | 2008/6778 [21:59<52:29,  1.51it/s][A
Epoch 1:  30%|██▉       | 2009/6778 [22:00<52:35,  1.51it/s][A
Epoch 1:  30%|██▉       | 2010/6778 [22:00<52:32,  1.51it/s][A
Epoch 1:  30%|██▉       | 2011/6778 [22:01<52:31,  1.51it/s][A
Epoch 1:  30%|██▉       | 2012/6778 [22:02<52:46,  1.51it/s][A
Epoch 1:  30%|██▉       | 2013/6778 [22:02<52:31,  1.51it/s][A
Epoch 1:  30%|██▉       | 2014/6778 [22:03<52:29,  1.51it/s][A
Epoch 1:  30%|██▉       | 2015/6778 [22:04<52:19,  1.52it/s][A
Epoch 1:  30%|██▉       | 2016/6778 [22:04<52:11,  1.52it/s][A
Epoch 1:  30%|██▉       | 2017/6778 [22


Epoch: 0, Loss0.3098894831997368



Epoch 1:  30%|███       | 2052/6778 [22:28<52:06,  1.51it/s][A
Epoch 1:  30%|███       | 2053/6778 [22:29<51:59,  1.51it/s][A
Epoch 1:  30%|███       | 2054/6778 [22:29<51:56,  1.52it/s][A
Epoch 1:  30%|███       | 2055/6778 [22:30<51:51,  1.52it/s][A
Epoch 1:  30%|███       | 2056/6778 [22:31<51:43,  1.52it/s][A
Epoch 1:  30%|███       | 2057/6778 [22:31<51:35,  1.53it/s][A
Epoch 1:  30%|███       | 2058/6778 [22:32<51:32,  1.53it/s][A
Epoch 1:  30%|███       | 2059/6778 [22:32<51:26,  1.53it/s][A
Epoch 1:  30%|███       | 2060/6778 [22:33<51:19,  1.53it/s][A
Epoch 1:  30%|███       | 2061/6778 [22:34<51:21,  1.53it/s][A
Epoch 1:  30%|███       | 2062/6778 [22:34<51:22,  1.53it/s][A
Epoch 1:  30%|███       | 2063/6778 [22:35<51:32,  1.52it/s][A
Epoch 1:  30%|███       | 2064/6778 [22:36<51:29,  1.53it/s][A
Epoch 1:  30%|███       | 2065/6778 [22:36<51:15,  1.53it/s][A
Epoch 1:  30%|███       | 2066/6778 [22:37<51:14,  1.53it/s][A
Epoch 1:  30%|███       | 2067/6778 [22


Epoch: 0, Loss0.30971924467335876



Epoch 1:  31%|███       | 2102/6778 [23:01<50:59,  1.53it/s][A
Epoch 1:  31%|███       | 2103/6778 [23:01<51:00,  1.53it/s][A
Epoch 1:  31%|███       | 2104/6778 [23:02<50:59,  1.53it/s][A
Epoch 1:  31%|███       | 2105/6778 [23:03<50:57,  1.53it/s][A
Epoch 1:  31%|███       | 2106/6778 [23:03<50:57,  1.53it/s][A
Epoch 1:  31%|███       | 2107/6778 [23:04<51:01,  1.53it/s][A
Epoch 1:  31%|███       | 2108/6778 [23:05<51:00,  1.53it/s][A
Epoch 1:  31%|███       | 2109/6778 [23:05<51:05,  1.52it/s][A
Epoch 1:  31%|███       | 2110/6778 [23:06<50:59,  1.53it/s][A
Epoch 1:  31%|███       | 2111/6778 [23:07<51:16,  1.52it/s][A
Epoch 1:  31%|███       | 2112/6778 [23:07<51:10,  1.52it/s][A
Epoch 1:  31%|███       | 2113/6778 [23:08<51:15,  1.52it/s][A
Epoch 1:  31%|███       | 2114/6778 [23:09<51:11,  1.52it/s][A
Epoch 1:  31%|███       | 2115/6778 [23:09<51:30,  1.51it/s][A
Epoch 1:  31%|███       | 2116/6778 [23:10<50:47,  1.53it/s][A
Epoch 1:  31%|███       | 2117/6778 [23


Epoch: 0, Loss0.309490080183326



Epoch 1:  32%|███▏      | 2152/6778 [23:33<50:55,  1.51it/s][A
Epoch 1:  32%|███▏      | 2153/6778 [23:34<51:06,  1.51it/s][A
Epoch 1:  32%|███▏      | 2154/6778 [23:35<51:09,  1.51it/s][A
Epoch 1:  32%|███▏      | 2155/6778 [23:35<50:58,  1.51it/s][A
Epoch 1:  32%|███▏      | 2156/6778 [23:36<51:05,  1.51it/s][A
Epoch 1:  32%|███▏      | 2157/6778 [23:37<50:35,  1.52it/s][A
Epoch 1:  32%|███▏      | 2158/6778 [23:37<50:31,  1.52it/s][A
Epoch 1:  32%|███▏      | 2159/6778 [23:38<50:30,  1.52it/s][A
Epoch 1:  32%|███▏      | 2160/6778 [23:39<50:25,  1.53it/s][A
Epoch 1:  32%|███▏      | 2161/6778 [23:39<50:21,  1.53it/s][A
Epoch 1:  32%|███▏      | 2162/6778 [23:40<50:15,  1.53it/s][A
Epoch 1:  32%|███▏      | 2163/6778 [23:41<50:14,  1.53it/s][A
Epoch 1:  32%|███▏      | 2164/6778 [23:41<50:13,  1.53it/s][A
Epoch 1:  32%|███▏      | 2165/6778 [23:42<50:14,  1.53it/s][A
Epoch 1:  32%|███▏      | 2166/6778 [23:43<50:16,  1.53it/s][A
Epoch 1:  32%|███▏      | 2167/6778 [23


Epoch: 0, Loss0.3091003506163855



Epoch 1:  32%|███▏      | 2202/6778 [24:06<49:57,  1.53it/s][A
Epoch 1:  33%|███▎      | 2203/6778 [24:07<49:51,  1.53it/s][A
Epoch 1:  33%|███▎      | 2204/6778 [24:08<49:49,  1.53it/s][A
Epoch 1:  33%|███▎      | 2205/6778 [24:08<49:56,  1.53it/s][A
Epoch 1:  33%|███▎      | 2206/6778 [24:09<49:58,  1.52it/s][A
Epoch 1:  33%|███▎      | 2207/6778 [24:10<49:58,  1.52it/s][A
Epoch 1:  33%|███▎      | 2208/6778 [24:10<49:52,  1.53it/s][A
Epoch 1:  33%|███▎      | 2209/6778 [24:11<50:03,  1.52it/s][A
Epoch 1:  33%|███▎      | 2210/6778 [24:12<50:02,  1.52it/s][A
Epoch 1:  33%|███▎      | 2211/6778 [24:12<49:55,  1.52it/s][A
Epoch 1:  33%|███▎      | 2212/6778 [24:13<49:56,  1.52it/s][A
Epoch 1:  33%|███▎      | 2213/6778 [24:14<50:19,  1.51it/s][A
Epoch 1:  33%|███▎      | 2214/6778 [24:14<50:09,  1.52it/s][A
Epoch 1:  33%|███▎      | 2215/6778 [24:15<50:13,  1.51it/s][A
Epoch 1:  33%|███▎      | 2216/6778 [24:16<50:08,  1.52it/s][A
Epoch 1:  33%|███▎      | 2217/6778 [24


Epoch: 0, Loss0.3090244912170453



Epoch 1:  33%|███▎      | 2252/6778 [24:39<49:19,  1.53it/s][A
Epoch 1:  33%|███▎      | 2253/6778 [24:40<49:12,  1.53it/s][A
Epoch 1:  33%|███▎      | 2254/6778 [24:40<49:42,  1.52it/s][A
Epoch 1:  33%|███▎      | 2255/6778 [24:41<49:43,  1.52it/s][A
Epoch 1:  33%|███▎      | 2256/6778 [24:42<49:35,  1.52it/s][A
Epoch 1:  33%|███▎      | 2257/6778 [24:42<49:45,  1.51it/s][A
Epoch 1:  33%|███▎      | 2258/6778 [24:43<49:55,  1.51it/s][A
Epoch 1:  33%|███▎      | 2259/6778 [24:44<49:26,  1.52it/s][A
Epoch 1:  33%|███▎      | 2260/6778 [24:44<49:19,  1.53it/s][A
Epoch 1:  33%|███▎      | 2261/6778 [24:45<49:19,  1.53it/s][A
Epoch 1:  33%|███▎      | 2262/6778 [24:46<49:14,  1.53it/s][A
Epoch 1:  33%|███▎      | 2263/6778 [24:46<49:26,  1.52it/s][A
Epoch 1:  33%|███▎      | 2264/6778 [24:47<49:25,  1.52it/s][A
Epoch 1:  33%|███▎      | 2265/6778 [24:48<49:20,  1.52it/s][A
Epoch 1:  33%|███▎      | 2266/6778 [24:48<49:22,  1.52it/s][A
Epoch 1:  33%|███▎      | 2267/6778 [24


Epoch: 0, Loss0.3090332702825454



Epoch 1:  34%|███▍      | 2302/6778 [25:12<48:59,  1.52it/s][A
Epoch 1:  34%|███▍      | 2303/6778 [25:13<48:59,  1.52it/s][A
Epoch 1:  34%|███▍      | 2304/6778 [25:13<48:57,  1.52it/s][A
Epoch 1:  34%|███▍      | 2305/6778 [25:14<48:51,  1.53it/s][A
Epoch 1:  34%|███▍      | 2306/6778 [25:15<48:46,  1.53it/s][A
Epoch 1:  34%|███▍      | 2307/6778 [25:15<48:48,  1.53it/s][A
Epoch 1:  34%|███▍      | 2308/6778 [25:16<48:44,  1.53it/s][A
Epoch 1:  34%|███▍      | 2309/6778 [25:17<48:45,  1.53it/s][A
Epoch 1:  34%|███▍      | 2310/6778 [25:17<48:42,  1.53it/s][A
Epoch 1:  34%|███▍      | 2311/6778 [25:18<48:38,  1.53it/s][A
Epoch 1:  34%|███▍      | 2312/6778 [25:18<48:38,  1.53it/s][A
Epoch 1:  34%|███▍      | 2313/6778 [25:19<48:42,  1.53it/s][A
Epoch 1:  34%|███▍      | 2314/6778 [25:20<48:43,  1.53it/s][A
Epoch 1:  34%|███▍      | 2315/6778 [25:20<48:38,  1.53it/s][A
Epoch 1:  34%|███▍      | 2316/6778 [25:21<48:55,  1.52it/s][A
Epoch 1:  34%|███▍      | 2317/6778 [25


Epoch: 0, Loss0.30883615391716357



Epoch 1:  35%|███▍      | 2352/6778 [25:45<48:05,  1.53it/s][A
Epoch 1:  35%|███▍      | 2353/6778 [25:45<48:09,  1.53it/s][A
Epoch 1:  35%|███▍      | 2354/6778 [25:46<48:15,  1.53it/s][A
Epoch 1:  35%|███▍      | 2355/6778 [25:47<48:10,  1.53it/s][A
Epoch 1:  35%|███▍      | 2356/6778 [25:47<48:03,  1.53it/s][A
Epoch 1:  35%|███▍      | 2357/6778 [25:48<48:28,  1.52it/s][A
Epoch 1:  35%|███▍      | 2358/6778 [25:49<48:36,  1.52it/s][A
Epoch 1:  35%|███▍      | 2359/6778 [25:49<48:38,  1.51it/s][A
Epoch 1:  35%|███▍      | 2360/6778 [25:50<48:47,  1.51it/s][A
Epoch 1:  35%|███▍      | 2361/6778 [25:51<48:37,  1.51it/s][A
Epoch 1:  35%|███▍      | 2362/6778 [25:51<48:05,  1.53it/s][A
Epoch 1:  35%|███▍      | 2363/6778 [25:52<47:58,  1.53it/s][A
Epoch 1:  35%|███▍      | 2364/6778 [25:53<48:16,  1.52it/s][A
Epoch 1:  35%|███▍      | 2365/6778 [25:53<48:06,  1.53it/s][A
Epoch 1:  35%|███▍      | 2366/6778 [25:54<48:07,  1.53it/s][A
Epoch 1:  35%|███▍      | 2367/6778 [25


Epoch: 0, Loss0.30850498954525396



Epoch 1:  35%|███▌      | 2402/6778 [26:18<48:12,  1.51it/s][A
Epoch 1:  35%|███▌      | 2403/6778 [26:18<47:58,  1.52it/s][A
Epoch 1:  35%|███▌      | 2404/6778 [26:19<47:45,  1.53it/s][A
Epoch 1:  35%|███▌      | 2405/6778 [26:20<47:40,  1.53it/s][A
Epoch 1:  35%|███▌      | 2406/6778 [26:20<47:40,  1.53it/s][A
Epoch 1:  36%|███▌      | 2407/6778 [26:21<47:44,  1.53it/s][A
Epoch 1:  36%|███▌      | 2408/6778 [26:21<47:37,  1.53it/s][A
Epoch 1:  36%|███▌      | 2409/6778 [26:22<47:39,  1.53it/s][A
Epoch 1:  36%|███▌      | 2410/6778 [26:23<47:37,  1.53it/s][A
Epoch 1:  36%|███▌      | 2411/6778 [26:23<47:37,  1.53it/s][A
Epoch 1:  36%|███▌      | 2412/6778 [26:24<47:41,  1.53it/s][A
Epoch 1:  36%|███▌      | 2413/6778 [26:25<47:37,  1.53it/s][A
Epoch 1:  36%|███▌      | 2414/6778 [26:25<47:33,  1.53it/s][A
Epoch 1:  36%|███▌      | 2415/6778 [26:26<47:37,  1.53it/s][A
Epoch 1:  36%|███▌      | 2416/6778 [26:27<47:36,  1.53it/s][A
Epoch 1:  36%|███▌      | 2417/6778 [26


Epoch: 0, Loss0.3083988423343339



Epoch 1:  36%|███▌      | 2452/6778 [26:50<47:25,  1.52it/s][A
Epoch 1:  36%|███▌      | 2453/6778 [26:51<47:24,  1.52it/s][A
Epoch 1:  36%|███▌      | 2454/6778 [26:52<47:18,  1.52it/s][A
Epoch 1:  36%|███▌      | 2455/6778 [26:52<47:14,  1.53it/s][A
Epoch 1:  36%|███▌      | 2456/6778 [26:53<47:09,  1.53it/s][A
Epoch 1:  36%|███▌      | 2457/6778 [26:54<47:09,  1.53it/s][A
Epoch 1:  36%|███▋      | 2458/6778 [26:54<47:06,  1.53it/s][A
Epoch 1:  36%|███▋      | 2459/6778 [26:55<47:39,  1.51it/s][A
Epoch 1:  36%|███▋      | 2460/6778 [26:56<47:28,  1.52it/s][A
Epoch 1:  36%|███▋      | 2461/6778 [26:56<47:47,  1.51it/s][A
Epoch 1:  36%|███▋      | 2462/6778 [26:57<47:52,  1.50it/s][A
Epoch 1:  36%|███▋      | 2463/6778 [26:58<47:45,  1.51it/s][A
Epoch 1:  36%|███▋      | 2464/6778 [26:58<47:37,  1.51it/s][A
Epoch 1:  36%|███▋      | 2465/6778 [26:59<47:37,  1.51it/s][A
Epoch 1:  36%|███▋      | 2466/6778 [27:00<47:27,  1.51it/s][A
Epoch 1:  36%|███▋      | 2467/6778 [27


Epoch: 0, Loss0.3082867876255288



Epoch 1:  37%|███▋      | 2502/6778 [27:23<46:59,  1.52it/s][A
Epoch 1:  37%|███▋      | 2503/6778 [27:24<46:58,  1.52it/s][A
Epoch 1:  37%|███▋      | 2504/6778 [27:25<47:17,  1.51it/s][A
Epoch 1:  37%|███▋      | 2505/6778 [27:25<46:59,  1.52it/s][A
Epoch 1:  37%|███▋      | 2506/6778 [27:26<46:51,  1.52it/s][A
Epoch 1:  37%|███▋      | 2507/6778 [27:27<46:45,  1.52it/s][A
Epoch 1:  37%|███▋      | 2508/6778 [27:27<46:42,  1.52it/s][A
Epoch 1:  37%|███▋      | 2509/6778 [27:28<46:41,  1.52it/s][A
Epoch 1:  37%|███▋      | 2510/6778 [27:28<46:37,  1.53it/s][A
Epoch 1:  37%|███▋      | 2511/6778 [27:29<46:36,  1.53it/s][A
Epoch 1:  37%|███▋      | 2512/6778 [27:30<46:32,  1.53it/s][A
Epoch 1:  37%|███▋      | 2513/6778 [27:30<46:36,  1.53it/s][A
Epoch 1:  37%|███▋      | 2514/6778 [27:31<46:28,  1.53it/s][A
Epoch 1:  37%|███▋      | 2515/6778 [27:32<46:25,  1.53it/s][A
Epoch 1:  37%|███▋      | 2516/6778 [27:32<46:30,  1.53it/s][A
Epoch 1:  37%|███▋      | 2517/6778 [27


Epoch: 0, Loss0.30834602138158246



Epoch 1:  38%|███▊      | 2552/6778 [27:56<46:04,  1.53it/s][A
Epoch 1:  38%|███▊      | 2553/6778 [27:57<46:08,  1.53it/s][A
Epoch 1:  38%|███▊      | 2554/6778 [27:57<46:10,  1.52it/s][A
Epoch 1:  38%|███▊      | 2555/6778 [27:58<46:15,  1.52it/s][A
Epoch 1:  38%|███▊      | 2556/6778 [27:59<46:12,  1.52it/s][A
Epoch 1:  38%|███▊      | 2557/6778 [27:59<46:07,  1.53it/s][A
Epoch 1:  38%|███▊      | 2558/6778 [28:00<46:00,  1.53it/s][A
Epoch 1:  38%|███▊      | 2559/6778 [28:01<46:02,  1.53it/s][A
Epoch 1:  38%|███▊      | 2560/6778 [28:01<46:03,  1.53it/s][A
Epoch 1:  38%|███▊      | 2561/6778 [28:02<46:19,  1.52it/s][A
Epoch 1:  38%|███▊      | 2562/6778 [28:03<46:19,  1.52it/s][A
Epoch 1:  38%|███▊      | 2563/6778 [28:03<46:25,  1.51it/s][A
Epoch 1:  38%|███▊      | 2564/6778 [28:04<46:26,  1.51it/s][A
Epoch 1:  38%|███▊      | 2565/6778 [28:05<46:59,  1.49it/s][A
Epoch 1:  38%|███▊      | 2566/6778 [28:05<46:50,  1.50it/s][A
Epoch 1:  38%|███▊      | 2567/6778 [28


Epoch: 0, Loss0.30830232801631247



Epoch 1:  38%|███▊      | 2602/6778 [28:29<45:44,  1.52it/s][A
Epoch 1:  38%|███▊      | 2603/6778 [28:30<45:46,  1.52it/s][A
Epoch 1:  38%|███▊      | 2604/6778 [28:30<45:47,  1.52it/s][A
Epoch 1:  38%|███▊      | 2605/6778 [28:31<45:43,  1.52it/s][A
Epoch 1:  38%|███▊      | 2606/6778 [28:32<45:58,  1.51it/s][A
Epoch 1:  38%|███▊      | 2607/6778 [28:32<46:02,  1.51it/s][A
Epoch 1:  38%|███▊      | 2608/6778 [28:33<45:32,  1.53it/s][A
Epoch 1:  38%|███▊      | 2609/6778 [28:34<45:30,  1.53it/s][A
Epoch 1:  39%|███▊      | 2610/6778 [28:34<45:28,  1.53it/s][A
Epoch 1:  39%|███▊      | 2611/6778 [28:35<45:33,  1.52it/s][A
Epoch 1:  39%|███▊      | 2612/6778 [28:35<45:30,  1.53it/s][A
Epoch 1:  39%|███▊      | 2613/6778 [28:36<45:27,  1.53it/s][A
Epoch 1:  39%|███▊      | 2614/6778 [28:37<45:31,  1.52it/s][A
Epoch 1:  39%|███▊      | 2615/6778 [28:37<45:23,  1.53it/s][A
Epoch 1:  39%|███▊      | 2616/6778 [28:38<45:22,  1.53it/s][A
Epoch 1:  39%|███▊      | 2617/6778 [28


Epoch: 0, Loss0.3081075963306004



Epoch 1:  39%|███▉      | 2652/6778 [29:02<45:09,  1.52it/s][A
Epoch 1:  39%|███▉      | 2653/6778 [29:02<45:03,  1.53it/s][A
Epoch 1:  39%|███▉      | 2654/6778 [29:03<45:13,  1.52it/s][A
Epoch 1:  39%|███▉      | 2655/6778 [29:04<45:29,  1.51it/s][A
Epoch 1:  39%|███▉      | 2656/6778 [29:04<45:15,  1.52it/s][A
Epoch 1:  39%|███▉      | 2657/6778 [29:05<45:16,  1.52it/s][A
Epoch 1:  39%|███▉      | 2658/6778 [29:06<45:06,  1.52it/s][A
Epoch 1:  39%|███▉      | 2659/6778 [29:06<45:02,  1.52it/s][A
Epoch 1:  39%|███▉      | 2660/6778 [29:07<44:57,  1.53it/s][A
Epoch 1:  39%|███▉      | 2661/6778 [29:08<44:52,  1.53it/s][A
Epoch 1:  39%|███▉      | 2662/6778 [29:08<44:52,  1.53it/s][A
Epoch 1:  39%|███▉      | 2663/6778 [29:09<44:47,  1.53it/s][A
Epoch 1:  39%|███▉      | 2664/6778 [29:10<45:28,  1.51it/s][A
Epoch 1:  39%|███▉      | 2665/6778 [29:10<44:59,  1.52it/s][A
Epoch 1:  39%|███▉      | 2666/6778 [29:11<45:14,  1.52it/s][A
Epoch 1:  39%|███▉      | 2667/6778 [29


Epoch: 0, Loss0.3078638636863969



Epoch 1:  40%|███▉      | 2702/6778 [29:35<44:21,  1.53it/s][A
Epoch 1:  40%|███▉      | 2703/6778 [29:35<44:22,  1.53it/s][A
Epoch 1:  40%|███▉      | 2704/6778 [29:36<44:21,  1.53it/s][A
Epoch 1:  40%|███▉      | 2705/6778 [29:37<44:33,  1.52it/s][A
Epoch 1:  40%|███▉      | 2706/6778 [29:37<44:33,  1.52it/s][A
Epoch 1:  40%|███▉      | 2707/6778 [29:38<44:49,  1.51it/s][A
Epoch 1:  40%|███▉      | 2708/6778 [29:39<44:54,  1.51it/s][A
Epoch 1:  40%|███▉      | 2709/6778 [29:39<44:58,  1.51it/s][A
Epoch 1:  40%|███▉      | 2710/6778 [29:40<44:48,  1.51it/s][A
Epoch 1:  40%|███▉      | 2711/6778 [29:40<44:40,  1.52it/s][A
Epoch 1:  40%|████      | 2712/6778 [29:41<44:35,  1.52it/s][A
Epoch 1:  40%|████      | 2713/6778 [29:42<44:33,  1.52it/s][A
Epoch 1:  40%|████      | 2714/6778 [29:42<44:29,  1.52it/s][A
Epoch 1:  40%|████      | 2715/6778 [29:43<44:32,  1.52it/s][A
Epoch 1:  40%|████      | 2716/6778 [29:44<44:28,  1.52it/s][A
Epoch 1:  40%|████      | 2717/6778 [29


Epoch: 0, Loss0.30792438898605246



Epoch 1:  41%|████      | 2752/6778 [30:07<43:57,  1.53it/s][A
Epoch 1:  41%|████      | 2753/6778 [30:08<44:03,  1.52it/s][A
Epoch 1:  41%|████      | 2754/6778 [30:09<43:56,  1.53it/s][A
Epoch 1:  41%|████      | 2755/6778 [30:09<43:55,  1.53it/s][A
Epoch 1:  41%|████      | 2756/6778 [30:10<43:53,  1.53it/s][A
Epoch 1:  41%|████      | 2757/6778 [30:11<43:47,  1.53it/s][A
Epoch 1:  41%|████      | 2758/6778 [30:11<43:43,  1.53it/s][A
Epoch 1:  41%|████      | 2759/6778 [30:12<43:55,  1.52it/s][A
Epoch 1:  41%|████      | 2760/6778 [30:13<43:48,  1.53it/s][A
Epoch 1:  41%|████      | 2761/6778 [30:13<43:50,  1.53it/s][A
Epoch 1:  41%|████      | 2762/6778 [30:14<43:46,  1.53it/s][A
Epoch 1:  41%|████      | 2763/6778 [30:15<43:43,  1.53it/s][A
Epoch 1:  41%|████      | 2764/6778 [30:15<43:49,  1.53it/s][A
Epoch 1:  41%|████      | 2765/6778 [30:16<43:39,  1.53it/s][A
Epoch 1:  41%|████      | 2766/6778 [30:17<43:55,  1.52it/s][A
Epoch 1:  41%|████      | 2767/6778 [30


Epoch: 0, Loss0.30770121508679277



Epoch 1:  41%|████▏     | 2802/6778 [30:40<43:23,  1.53it/s][A
Epoch 1:  41%|████▏     | 2803/6778 [30:41<43:20,  1.53it/s][A
Epoch 1:  41%|████▏     | 2804/6778 [30:42<43:19,  1.53it/s][A
Epoch 1:  41%|████▏     | 2805/6778 [30:42<43:18,  1.53it/s][A
Epoch 1:  41%|████▏     | 2806/6778 [30:43<43:19,  1.53it/s][A
Epoch 1:  41%|████▏     | 2807/6778 [30:44<43:29,  1.52it/s][A
Epoch 1:  41%|████▏     | 2808/6778 [30:44<43:28,  1.52it/s][A
Epoch 1:  41%|████▏     | 2809/6778 [30:45<43:28,  1.52it/s][A
Epoch 1:  41%|████▏     | 2810/6778 [30:45<43:31,  1.52it/s][A
Epoch 1:  41%|████▏     | 2811/6778 [30:46<43:52,  1.51it/s][A
Epoch 1:  41%|████▏     | 2812/6778 [30:47<44:00,  1.50it/s][A
Epoch 1:  42%|████▏     | 2813/6778 [30:47<43:29,  1.52it/s][A
Epoch 1:  42%|████▏     | 2814/6778 [30:48<43:19,  1.52it/s][A
Epoch 1:  42%|████▏     | 2815/6778 [30:49<43:18,  1.53it/s][A
Epoch 1:  42%|████▏     | 2816/6778 [30:49<43:13,  1.53it/s][A
Epoch 1:  42%|████▏     | 2817/6778 [30


Epoch: 0, Loss0.30763459432202445



Epoch 1:  42%|████▏     | 2852/6778 [31:13<43:09,  1.52it/s][A
Epoch 1:  42%|████▏     | 2853/6778 [31:14<43:18,  1.51it/s][A
Epoch 1:  42%|████▏     | 2854/6778 [31:14<42:57,  1.52it/s][A
Epoch 1:  42%|████▏     | 2855/6778 [31:15<42:53,  1.52it/s][A
Epoch 1:  42%|████▏     | 2856/6778 [31:16<42:49,  1.53it/s][A
Epoch 1:  42%|████▏     | 2857/6778 [31:16<42:49,  1.53it/s][A
Epoch 1:  42%|████▏     | 2858/6778 [31:17<42:52,  1.52it/s][A
Epoch 1:  42%|████▏     | 2859/6778 [31:18<42:48,  1.53it/s][A
Epoch 1:  42%|████▏     | 2860/6778 [31:18<42:42,  1.53it/s][A
Epoch 1:  42%|████▏     | 2861/6778 [31:19<42:41,  1.53it/s][A
Epoch 1:  42%|████▏     | 2862/6778 [31:20<42:49,  1.52it/s][A
Epoch 1:  42%|████▏     | 2863/6778 [31:20<42:44,  1.53it/s][A
Epoch 1:  42%|████▏     | 2864/6778 [31:21<42:47,  1.52it/s][A
Epoch 1:  42%|████▏     | 2865/6778 [31:22<42:42,  1.53it/s][A
Epoch 1:  42%|████▏     | 2866/6778 [31:22<42:41,  1.53it/s][A
Epoch 1:  42%|████▏     | 2867/6778 [31


Epoch: 0, Loss0.3078192796805981



Epoch 1:  43%|████▎     | 2902/6778 [31:46<42:18,  1.53it/s][A
Epoch 1:  43%|████▎     | 2903/6778 [31:47<42:22,  1.52it/s][A
Epoch 1:  43%|████▎     | 2904/6778 [31:47<42:18,  1.53it/s][A
Epoch 1:  43%|████▎     | 2905/6778 [31:48<42:24,  1.52it/s][A
Epoch 1:  43%|████▎     | 2906/6778 [31:49<42:19,  1.52it/s][A
Epoch 1:  43%|████▎     | 2907/6778 [31:49<42:23,  1.52it/s][A
Epoch 1:  43%|████▎     | 2908/6778 [31:50<42:24,  1.52it/s][A
Epoch 1:  43%|████▎     | 2909/6778 [31:51<42:24,  1.52it/s][A
Epoch 1:  43%|████▎     | 2910/6778 [31:51<42:49,  1.51it/s][A
Epoch 1:  43%|████▎     | 2911/6778 [31:52<42:57,  1.50it/s][A
Epoch 1:  43%|████▎     | 2912/6778 [31:53<42:54,  1.50it/s][A
Epoch 1:  43%|████▎     | 2913/6778 [31:53<42:53,  1.50it/s][A
Epoch 1:  43%|████▎     | 2914/6778 [31:54<42:39,  1.51it/s][A
Epoch 1:  43%|████▎     | 2915/6778 [31:54<42:18,  1.52it/s][A
Epoch 1:  43%|████▎     | 2916/6778 [31:55<42:17,  1.52it/s][A
Epoch 1:  43%|████▎     | 2917/6778 [31


Epoch: 0, Loss0.3078834512114767



Epoch 1:  44%|████▎     | 2952/6778 [32:19<42:12,  1.51it/s][A
Epoch 1:  44%|████▎     | 2953/6778 [32:19<42:15,  1.51it/s][A
Epoch 1:  44%|████▎     | 2954/6778 [32:20<42:26,  1.50it/s][A
Epoch 1:  44%|████▎     | 2955/6778 [32:21<42:30,  1.50it/s][A
Epoch 1:  44%|████▎     | 2956/6778 [32:21<42:01,  1.52it/s][A
Epoch 1:  44%|████▎     | 2957/6778 [32:22<41:59,  1.52it/s][A
Epoch 1:  44%|████▎     | 2958/6778 [32:23<41:55,  1.52it/s][A
Epoch 1:  44%|████▎     | 2959/6778 [32:23<41:46,  1.52it/s][A
Epoch 1:  44%|████▎     | 2960/6778 [32:24<41:45,  1.52it/s][A
Epoch 1:  44%|████▎     | 2961/6778 [32:25<41:43,  1.52it/s][A
Epoch 1:  44%|████▎     | 2962/6778 [32:25<41:46,  1.52it/s][A
Epoch 1:  44%|████▎     | 2963/6778 [32:26<41:46,  1.52it/s][A
Epoch 1:  44%|████▎     | 2964/6778 [32:27<41:36,  1.53it/s][A
Epoch 1:  44%|████▎     | 2965/6778 [32:27<41:33,  1.53it/s][A
Epoch 1:  44%|████▍     | 2966/6778 [32:28<41:26,  1.53it/s][A
Epoch 1:  44%|████▍     | 2967/6778 [32


Epoch: 0, Loss0.3077472127360807



Epoch 1:  44%|████▍     | 3002/6778 [32:52<41:20,  1.52it/s][A
Epoch 1:  44%|████▍     | 3003/6778 [32:52<41:26,  1.52it/s][A
Epoch 1:  44%|████▍     | 3004/6778 [32:53<41:11,  1.53it/s][A
Epoch 1:  44%|████▍     | 3005/6778 [32:54<41:14,  1.52it/s][A
Epoch 1:  44%|████▍     | 3006/6778 [32:54<41:10,  1.53it/s][A
Epoch 1:  44%|████▍     | 3007/6778 [32:55<41:10,  1.53it/s][A
Epoch 1:  44%|████▍     | 3008/6778 [32:56<41:10,  1.53it/s][A
Epoch 1:  44%|████▍     | 3009/6778 [32:56<41:08,  1.53it/s][A
Epoch 1:  44%|████▍     | 3010/6778 [32:57<41:11,  1.52it/s][A
Epoch 1:  44%|████▍     | 3011/6778 [32:58<41:06,  1.53it/s][A
Epoch 1:  44%|████▍     | 3012/6778 [32:58<41:20,  1.52it/s][A
Epoch 1:  44%|████▍     | 3013/6778 [32:59<41:20,  1.52it/s][A
Epoch 1:  44%|████▍     | 3014/6778 [33:00<41:34,  1.51it/s][A
Epoch 1:  44%|████▍     | 3015/6778 [33:00<41:37,  1.51it/s][A
Epoch 1:  44%|████▍     | 3016/6778 [33:01<41:41,  1.50it/s][A
Epoch 1:  45%|████▍     | 3017/6778 [33


Epoch: 0, Loss0.30760120964321847



Epoch 1:  45%|████▌     | 3052/6778 [33:24<40:33,  1.53it/s][A
Epoch 1:  45%|████▌     | 3053/6778 [33:25<40:35,  1.53it/s][A
Epoch 1:  45%|████▌     | 3054/6778 [33:26<40:55,  1.52it/s][A
Epoch 1:  45%|████▌     | 3055/6778 [33:26<41:02,  1.51it/s][A
Epoch 1:  45%|████▌     | 3056/6778 [33:27<40:57,  1.51it/s][A
Epoch 1:  45%|████▌     | 3057/6778 [33:28<41:03,  1.51it/s][A
Epoch 1:  45%|████▌     | 3058/6778 [33:28<41:09,  1.51it/s][A
Epoch 1:  45%|████▌     | 3059/6778 [33:29<40:45,  1.52it/s][A
Epoch 1:  45%|████▌     | 3060/6778 [33:30<40:43,  1.52it/s][A
Epoch 1:  45%|████▌     | 3061/6778 [33:30<40:46,  1.52it/s][A
Epoch 1:  45%|████▌     | 3062/6778 [33:31<40:44,  1.52it/s][A
Epoch 1:  45%|████▌     | 3063/6778 [33:32<40:39,  1.52it/s][A
Epoch 1:  45%|████▌     | 3064/6778 [33:32<40:41,  1.52it/s][A
Epoch 1:  45%|████▌     | 3065/6778 [33:33<40:31,  1.53it/s][A
Epoch 1:  45%|████▌     | 3066/6778 [33:34<40:35,  1.52it/s][A
Epoch 1:  45%|████▌     | 3067/6778 [33


Epoch: 0, Loss0.3075780738859898



Epoch 1:  46%|████▌     | 3102/6778 [33:57<40:17,  1.52it/s][A
Epoch 1:  46%|████▌     | 3103/6778 [33:58<40:07,  1.53it/s][A
Epoch 1:  46%|████▌     | 3104/6778 [33:59<40:16,  1.52it/s][A
Epoch 1:  46%|████▌     | 3105/6778 [33:59<40:11,  1.52it/s][A
Epoch 1:  46%|████▌     | 3106/6778 [34:00<40:16,  1.52it/s][A
Epoch 1:  46%|████▌     | 3107/6778 [34:01<40:08,  1.52it/s][A
Epoch 1:  46%|████▌     | 3108/6778 [34:01<40:14,  1.52it/s][A
Epoch 1:  46%|████▌     | 3109/6778 [34:02<40:11,  1.52it/s][A
Epoch 1:  46%|████▌     | 3110/6778 [34:03<40:07,  1.52it/s][A
Epoch 1:  46%|████▌     | 3111/6778 [34:03<40:03,  1.53it/s][A
Epoch 1:  46%|████▌     | 3112/6778 [34:04<40:00,  1.53it/s][A
Epoch 1:  46%|████▌     | 3113/6778 [34:05<40:07,  1.52it/s][A
Epoch 1:  46%|████▌     | 3114/6778 [34:05<40:02,  1.52it/s][A
Epoch 1:  46%|████▌     | 3115/6778 [34:06<40:20,  1.51it/s][A
Epoch 1:  46%|████▌     | 3116/6778 [34:07<40:22,  1.51it/s][A
Epoch 1:  46%|████▌     | 3117/6778 [34


Epoch: 0, Loss0.30749102956631646



Epoch 1:  47%|████▋     | 3152/6778 [34:30<39:44,  1.52it/s][A
Epoch 1:  47%|████▋     | 3153/6778 [34:31<39:45,  1.52it/s][A
Epoch 1:  47%|████▋     | 3154/6778 [34:32<39:48,  1.52it/s][A
Epoch 1:  47%|████▋     | 3155/6778 [34:32<39:43,  1.52it/s][A
Epoch 1:  47%|████▋     | 3156/6778 [34:33<39:58,  1.51it/s][A
Epoch 1:  47%|████▋     | 3157/6778 [34:34<39:53,  1.51it/s][A
Epoch 1:  47%|████▋     | 3158/6778 [34:34<39:59,  1.51it/s][A
Epoch 1:  47%|████▋     | 3159/6778 [34:35<39:57,  1.51it/s][A
Epoch 1:  47%|████▋     | 3160/6778 [34:36<39:53,  1.51it/s][A
Epoch 1:  47%|████▋     | 3161/6778 [34:36<39:37,  1.52it/s][A
Epoch 1:  47%|████▋     | 3162/6778 [34:37<39:32,  1.52it/s][A
Epoch 1:  47%|████▋     | 3163/6778 [34:38<39:33,  1.52it/s][A
Epoch 1:  47%|████▋     | 3164/6778 [34:38<39:28,  1.53it/s][A
Epoch 1:  47%|████▋     | 3165/6778 [34:39<39:40,  1.52it/s][A
Epoch 1:  47%|████▋     | 3166/6778 [34:39<39:28,  1.52it/s][A
Epoch 1:  47%|████▋     | 3167/6778 [34


Epoch: 0, Loss0.30738004655930745



Epoch 1:  47%|████▋     | 3202/6778 [35:03<39:28,  1.51it/s][A
Epoch 1:  47%|████▋     | 3203/6778 [35:04<39:14,  1.52it/s][A
Epoch 1:  47%|████▋     | 3204/6778 [35:05<39:17,  1.52it/s][A
Epoch 1:  47%|████▋     | 3205/6778 [35:05<39:15,  1.52it/s][A
Epoch 1:  47%|████▋     | 3206/6778 [35:06<39:12,  1.52it/s][A
Epoch 1:  47%|████▋     | 3207/6778 [35:07<39:08,  1.52it/s][A
Epoch 1:  47%|████▋     | 3208/6778 [35:07<39:07,  1.52it/s][A
Epoch 1:  47%|████▋     | 3209/6778 [35:08<39:07,  1.52it/s][A
Epoch 1:  47%|████▋     | 3210/6778 [35:09<39:02,  1.52it/s][A
Epoch 1:  47%|████▋     | 3211/6778 [35:09<39:03,  1.52it/s][A
Epoch 1:  47%|████▋     | 3212/6778 [35:10<38:59,  1.52it/s][A
Epoch 1:  47%|████▋     | 3213/6778 [35:10<38:58,  1.52it/s][A
Epoch 1:  47%|████▋     | 3214/6778 [35:11<38:59,  1.52it/s][A
Epoch 1:  47%|████▋     | 3215/6778 [35:12<38:59,  1.52it/s][A
Epoch 1:  47%|████▋     | 3216/6778 [35:12<39:00,  1.52it/s][A
Epoch 1:  47%|████▋     | 3217/6778 [35


Epoch: 0, Loss0.3075948230823676



Epoch 1:  48%|████▊     | 3252/6778 [35:36<38:27,  1.53it/s][A
Epoch 1:  48%|████▊     | 3253/6778 [35:37<38:28,  1.53it/s][A
Epoch 1:  48%|████▊     | 3254/6778 [35:37<38:29,  1.53it/s][A
Epoch 1:  48%|████▊     | 3255/6778 [35:38<38:30,  1.52it/s][A
Epoch 1:  48%|████▊     | 3256/6778 [35:39<38:22,  1.53it/s][A
Epoch 1:  48%|████▊     | 3257/6778 [35:39<38:34,  1.52it/s][A
Epoch 1:  48%|████▊     | 3258/6778 [35:40<38:47,  1.51it/s][A
Epoch 1:  48%|████▊     | 3259/6778 [35:41<38:44,  1.51it/s][A
Epoch 1:  48%|████▊     | 3260/6778 [35:41<38:44,  1.51it/s][A
Epoch 1:  48%|████▊     | 3261/6778 [35:42<38:43,  1.51it/s][A
Epoch 1:  48%|████▊     | 3262/6778 [35:43<38:56,  1.51it/s][A
Epoch 1:  48%|████▊     | 3263/6778 [35:43<38:49,  1.51it/s][A
Epoch 1:  48%|████▊     | 3264/6778 [35:44<38:41,  1.51it/s][A
Epoch 1:  48%|████▊     | 3265/6778 [35:45<38:36,  1.52it/s][A
Epoch 1:  48%|████▊     | 3266/6778 [35:45<38:32,  1.52it/s][A
Epoch 1:  48%|████▊     | 3267/6778 [35


Epoch: 0, Loss0.30727801924264997



Epoch 1:  49%|████▊     | 3302/6778 [36:09<38:16,  1.51it/s][A
Epoch 1:  49%|████▊     | 3303/6778 [36:10<38:25,  1.51it/s][A
Epoch 1:  49%|████▊     | 3304/6778 [36:10<38:25,  1.51it/s][A
Epoch 1:  49%|████▉     | 3305/6778 [36:11<38:19,  1.51it/s][A
Epoch 1:  49%|████▉     | 3306/6778 [36:12<38:12,  1.51it/s][A
Epoch 1:  49%|████▉     | 3307/6778 [36:12<38:10,  1.52it/s][A
Epoch 1:  49%|████▉     | 3308/6778 [36:13<38:02,  1.52it/s][A
Epoch 1:  49%|████▉     | 3309/6778 [36:14<38:07,  1.52it/s][A
Epoch 1:  49%|████▉     | 3310/6778 [36:14<37:56,  1.52it/s][A
Epoch 1:  49%|████▉     | 3311/6778 [36:15<37:55,  1.52it/s][A
Epoch 1:  49%|████▉     | 3312/6778 [36:16<37:55,  1.52it/s][A
Epoch 1:  49%|████▉     | 3313/6778 [36:16<38:00,  1.52it/s][A
Epoch 1:  49%|████▉     | 3314/6778 [36:17<37:56,  1.52it/s][A
Epoch 1:  49%|████▉     | 3315/6778 [36:18<37:55,  1.52it/s][A
Epoch 1:  49%|████▉     | 3316/6778 [36:18<37:51,  1.52it/s][A
Epoch 1:  49%|████▉     | 3317/6778 [36


Epoch: 0, Loss0.3071202922515711



Epoch 1:  49%|████▉     | 3352/6778 [36:42<37:24,  1.53it/s][A
Epoch 1:  49%|████▉     | 3353/6778 [36:43<37:17,  1.53it/s][A
Epoch 1:  49%|████▉     | 3354/6778 [36:43<37:19,  1.53it/s][A
Epoch 1:  49%|████▉     | 3355/6778 [36:44<37:16,  1.53it/s][A
Epoch 1:  50%|████▉     | 3356/6778 [36:45<37:19,  1.53it/s][A
Epoch 1:  50%|████▉     | 3357/6778 [36:45<37:21,  1.53it/s][A
Epoch 1:  50%|████▉     | 3358/6778 [36:46<37:20,  1.53it/s][A
Epoch 1:  50%|████▉     | 3359/6778 [36:47<37:16,  1.53it/s][A
Epoch 1:  50%|████▉     | 3360/6778 [36:47<37:28,  1.52it/s][A
Epoch 1:  50%|████▉     | 3361/6778 [36:48<37:23,  1.52it/s][A
Epoch 1:  50%|████▉     | 3362/6778 [36:49<37:29,  1.52it/s][A
Epoch 1:  50%|████▉     | 3363/6778 [36:49<37:34,  1.51it/s][A
Epoch 1:  50%|████▉     | 3364/6778 [36:50<37:45,  1.51it/s][A
Epoch 1:  50%|████▉     | 3365/6778 [36:51<37:48,  1.50it/s][A
Epoch 1:  50%|████▉     | 3366/6778 [36:51<37:26,  1.52it/s][A
Epoch 1:  50%|████▉     | 3367/6778 [36


Epoch: 0, Loss0.3070238264355895



Epoch 1:  50%|█████     | 3402/6778 [37:15<37:04,  1.52it/s][A
Epoch 1:  50%|█████     | 3403/6778 [37:16<37:18,  1.51it/s][A
Epoch 1:  50%|█████     | 3404/6778 [37:16<37:03,  1.52it/s][A
Epoch 1:  50%|█████     | 3405/6778 [37:17<37:15,  1.51it/s][A
Epoch 1:  50%|█████     | 3406/6778 [37:17<37:15,  1.51it/s][A
Epoch 1:  50%|█████     | 3407/6778 [37:18<36:49,  1.53it/s][A
Epoch 1:  50%|█████     | 3408/6778 [37:19<36:44,  1.53it/s][A
Epoch 1:  50%|█████     | 3409/6778 [37:19<36:42,  1.53it/s][A
Epoch 1:  50%|█████     | 3410/6778 [37:20<36:45,  1.53it/s][A
Epoch 1:  50%|█████     | 3411/6778 [37:21<36:40,  1.53it/s][A
Epoch 1:  50%|█████     | 3412/6778 [37:21<36:36,  1.53it/s][A
Epoch 1:  50%|█████     | 3413/6778 [37:22<36:43,  1.53it/s][A
Epoch 1:  50%|█████     | 3414/6778 [37:23<36:44,  1.53it/s][A
Epoch 1:  50%|█████     | 3415/6778 [37:23<36:34,  1.53it/s][A
Epoch 1:  50%|█████     | 3416/6778 [37:24<36:37,  1.53it/s][A
Epoch 1:  50%|█████     | 3417/6778 [37


Epoch: 0, Loss0.30666267269290176



Epoch 1:  51%|█████     | 3452/6778 [37:48<36:15,  1.53it/s][A
Epoch 1:  51%|█████     | 3453/6778 [37:48<36:14,  1.53it/s][A
Epoch 1:  51%|█████     | 3454/6778 [37:49<36:17,  1.53it/s][A
Epoch 1:  51%|█████     | 3455/6778 [37:50<36:25,  1.52it/s][A
Epoch 1:  51%|█████     | 3456/6778 [37:50<36:14,  1.53it/s][A
Epoch 1:  51%|█████     | 3457/6778 [37:51<36:12,  1.53it/s][A
Epoch 1:  51%|█████     | 3458/6778 [37:52<36:20,  1.52it/s][A
Epoch 1:  51%|█████     | 3459/6778 [37:52<36:08,  1.53it/s][A
Epoch 1:  51%|█████     | 3460/6778 [37:53<36:09,  1.53it/s][A
Epoch 1:  51%|█████     | 3461/6778 [37:54<36:12,  1.53it/s][A
Epoch 1:  51%|█████     | 3462/6778 [37:54<36:06,  1.53it/s][A
Epoch 1:  51%|█████     | 3463/6778 [37:55<36:31,  1.51it/s][A
Epoch 1:  51%|█████     | 3464/6778 [37:56<36:20,  1.52it/s][A
Epoch 1:  51%|█████     | 3465/6778 [37:56<36:22,  1.52it/s][A
Epoch 1:  51%|█████     | 3466/6778 [37:57<36:37,  1.51it/s][A
Epoch 1:  51%|█████     | 3467/6778 [37


Epoch: 0, Loss0.30698563201287515



Epoch 1:  52%|█████▏    | 3502/6778 [38:21<35:42,  1.53it/s][A
Epoch 1:  52%|█████▏    | 3503/6778 [38:21<35:42,  1.53it/s][A
Epoch 1:  52%|█████▏    | 3504/6778 [38:22<36:02,  1.51it/s][A
Epoch 1:  52%|█████▏    | 3505/6778 [38:23<36:04,  1.51it/s][A
Epoch 1:  52%|█████▏    | 3506/6778 [38:23<36:06,  1.51it/s][A
Epoch 1:  52%|█████▏    | 3507/6778 [38:24<36:04,  1.51it/s][A
Epoch 1:  52%|█████▏    | 3508/6778 [38:25<36:03,  1.51it/s][A
Epoch 1:  52%|█████▏    | 3509/6778 [38:25<36:06,  1.51it/s][A
Epoch 1:  52%|█████▏    | 3510/6778 [38:26<35:43,  1.52it/s][A
Epoch 1:  52%|█████▏    | 3511/6778 [38:26<35:42,  1.52it/s][A
Epoch 1:  52%|█████▏    | 3512/6778 [38:27<35:39,  1.53it/s][A
Epoch 1:  52%|█████▏    | 3513/6778 [38:28<35:39,  1.53it/s][A
Epoch 1:  52%|█████▏    | 3514/6778 [38:28<35:35,  1.53it/s][A
Epoch 1:  52%|█████▏    | 3515/6778 [38:29<35:42,  1.52it/s][A
Epoch 1:  52%|█████▏    | 3516/6778 [38:30<35:38,  1.53it/s][A
Epoch 1:  52%|█████▏    | 3517/6778 [38


Epoch: 0, Loss0.30702072937357294



Epoch 1:  52%|█████▏    | 3552/6778 [38:53<35:20,  1.52it/s][A
Epoch 1:  52%|█████▏    | 3553/6778 [38:54<35:15,  1.52it/s][A
Epoch 1:  52%|█████▏    | 3554/6778 [38:55<35:22,  1.52it/s][A
Epoch 1:  52%|█████▏    | 3555/6778 [38:55<35:09,  1.53it/s][A
Epoch 1:  52%|█████▏    | 3556/6778 [38:56<35:02,  1.53it/s][A
Epoch 1:  52%|█████▏    | 3557/6778 [38:57<35:02,  1.53it/s][A
Epoch 1:  52%|█████▏    | 3558/6778 [38:57<35:03,  1.53it/s][A
Epoch 1:  53%|█████▎    | 3559/6778 [38:58<34:57,  1.53it/s][A
Epoch 1:  53%|█████▎    | 3560/6778 [38:59<34:59,  1.53it/s][A
Epoch 1:  53%|█████▎    | 3561/6778 [38:59<34:59,  1.53it/s][A
Epoch 1:  53%|█████▎    | 3562/6778 [39:00<35:01,  1.53it/s][A
Epoch 1:  53%|█████▎    | 3563/6778 [39:01<35:02,  1.53it/s][A
Epoch 1:  53%|█████▎    | 3564/6778 [39:01<35:00,  1.53it/s][A
Epoch 1:  53%|█████▎    | 3565/6778 [39:02<35:02,  1.53it/s][A
Epoch 1:  53%|█████▎    | 3566/6778 [39:03<35:05,  1.53it/s][A
Epoch 1:  53%|█████▎    | 3567/6778 [39


Epoch: 0, Loss0.306920529398793



Epoch 1:  53%|█████▎    | 3602/6778 [39:26<34:43,  1.52it/s][A
Epoch 1:  53%|█████▎    | 3603/6778 [39:27<34:43,  1.52it/s][A
Epoch 1:  53%|█████▎    | 3604/6778 [39:28<34:39,  1.53it/s][A
Epoch 1:  53%|█████▎    | 3605/6778 [39:28<34:44,  1.52it/s][A
Epoch 1:  53%|█████▎    | 3606/6778 [39:29<34:37,  1.53it/s][A
Epoch 1:  53%|█████▎    | 3607/6778 [39:30<34:48,  1.52it/s][A
Epoch 1:  53%|█████▎    | 3608/6778 [39:30<34:43,  1.52it/s][A
Epoch 1:  53%|█████▎    | 3609/6778 [39:31<34:52,  1.51it/s][A
Epoch 1:  53%|█████▎    | 3610/6778 [39:31<34:45,  1.52it/s][A
Epoch 1:  53%|█████▎    | 3611/6778 [39:32<34:52,  1.51it/s][A
Epoch 1:  53%|█████▎    | 3612/6778 [39:33<34:47,  1.52it/s][A
Epoch 1:  53%|█████▎    | 3613/6778 [39:33<34:41,  1.52it/s][A
Epoch 1:  53%|█████▎    | 3614/6778 [39:34<34:37,  1.52it/s][A
Epoch 1:  53%|█████▎    | 3615/6778 [39:35<34:34,  1.52it/s][A
Epoch 1:  53%|█████▎    | 3616/6778 [39:35<34:35,  1.52it/s][A
Epoch 1:  53%|█████▎    | 3617/6778 [39


Epoch: 0, Loss0.30660868231212235



Epoch 1:  54%|█████▍    | 3652/6778 [39:59<34:26,  1.51it/s][A
Epoch 1:  54%|█████▍    | 3653/6778 [40:00<34:24,  1.51it/s][A
Epoch 1:  54%|█████▍    | 3654/6778 [40:00<34:20,  1.52it/s][A
Epoch 1:  54%|█████▍    | 3655/6778 [40:01<34:16,  1.52it/s][A
Epoch 1:  54%|█████▍    | 3656/6778 [40:02<34:08,  1.52it/s][A
Epoch 1:  54%|█████▍    | 3657/6778 [40:02<34:02,  1.53it/s][A
Epoch 1:  54%|█████▍    | 3658/6778 [40:03<33:55,  1.53it/s][A
Epoch 1:  54%|█████▍    | 3659/6778 [40:04<33:59,  1.53it/s][A
Epoch 1:  54%|█████▍    | 3660/6778 [40:04<33:57,  1.53it/s][A
Epoch 1:  54%|█████▍    | 3661/6778 [40:05<33:55,  1.53it/s][A
Epoch 1:  54%|█████▍    | 3662/6778 [40:06<34:01,  1.53it/s][A
Epoch 1:  54%|█████▍    | 3663/6778 [40:06<33:56,  1.53it/s][A
Epoch 1:  54%|█████▍    | 3664/6778 [40:07<33:57,  1.53it/s][A
Epoch 1:  54%|█████▍    | 3665/6778 [40:08<33:57,  1.53it/s][A
Epoch 1:  54%|█████▍    | 3666/6778 [40:08<33:57,  1.53it/s][A
Epoch 1:  54%|█████▍    | 3667/6778 [40


Epoch: 0, Loss0.30657854899502357



Epoch 1:  55%|█████▍    | 3702/6778 [40:32<33:35,  1.53it/s][A
Epoch 1:  55%|█████▍    | 3703/6778 [40:33<33:37,  1.52it/s][A
Epoch 1:  55%|█████▍    | 3704/6778 [40:33<33:37,  1.52it/s][A
Epoch 1:  55%|█████▍    | 3705/6778 [40:34<33:39,  1.52it/s][A
Epoch 1:  55%|█████▍    | 3706/6778 [40:34<33:36,  1.52it/s][A
Epoch 1:  55%|█████▍    | 3707/6778 [40:35<33:34,  1.52it/s][A
Epoch 1:  55%|█████▍    | 3708/6778 [40:36<33:33,  1.52it/s][A
Epoch 1:  55%|█████▍    | 3709/6778 [40:36<33:35,  1.52it/s][A
Epoch 1:  55%|█████▍    | 3710/6778 [40:37<33:45,  1.52it/s][A
Epoch 1:  55%|█████▍    | 3711/6778 [40:38<33:43,  1.52it/s][A
Epoch 1:  55%|█████▍    | 3712/6778 [40:38<33:47,  1.51it/s][A
Epoch 1:  55%|█████▍    | 3713/6778 [40:39<34:02,  1.50it/s][A
Epoch 1:  55%|█████▍    | 3714/6778 [40:40<34:04,  1.50it/s][A
Epoch 1:  55%|█████▍    | 3715/6778 [40:40<33:42,  1.51it/s][A
Epoch 1:  55%|█████▍    | 3716/6778 [40:41<33:43,  1.51it/s][A
Epoch 1:  55%|█████▍    | 3717/6778 [40


Epoch: 0, Loss0.3066208252796997



Epoch 1:  55%|█████▌    | 3752/6778 [41:05<33:28,  1.51it/s][A
Epoch 1:  55%|█████▌    | 3753/6778 [41:05<33:27,  1.51it/s][A
Epoch 1:  55%|█████▌    | 3754/6778 [41:06<33:30,  1.50it/s][A
Epoch 1:  55%|█████▌    | 3755/6778 [41:07<33:38,  1.50it/s][A
Epoch 1:  55%|█████▌    | 3756/6778 [41:07<33:22,  1.51it/s][A
Epoch 1:  55%|█████▌    | 3757/6778 [41:08<33:16,  1.51it/s][A
Epoch 1:  55%|█████▌    | 3758/6778 [41:09<33:11,  1.52it/s][A
Epoch 1:  55%|█████▌    | 3759/6778 [41:09<33:00,  1.52it/s][A
Epoch 1:  55%|█████▌    | 3760/6778 [41:10<33:02,  1.52it/s][A
Epoch 1:  55%|█████▌    | 3761/6778 [41:11<32:56,  1.53it/s][A
Epoch 1:  56%|█████▌    | 3762/6778 [41:11<32:54,  1.53it/s][A
Epoch 1:  56%|█████▌    | 3763/6778 [41:12<32:56,  1.53it/s][A
Epoch 1:  56%|█████▌    | 3764/6778 [41:13<32:55,  1.53it/s][A
Epoch 1:  56%|█████▌    | 3765/6778 [41:13<32:57,  1.52it/s][A
Epoch 1:  56%|█████▌    | 3766/6778 [41:14<32:53,  1.53it/s][A
Epoch 1:  56%|█████▌    | 3767/6778 [41


Epoch: 0, Loss0.3064255500229463



Epoch 1:  56%|█████▌    | 3802/6778 [41:38<32:29,  1.53it/s][A
Epoch 1:  56%|█████▌    | 3803/6778 [41:38<32:37,  1.52it/s][A
Epoch 1:  56%|█████▌    | 3804/6778 [41:39<32:30,  1.52it/s][A
Epoch 1:  56%|█████▌    | 3805/6778 [41:40<32:32,  1.52it/s][A
Epoch 1:  56%|█████▌    | 3806/6778 [41:40<32:31,  1.52it/s][A
Epoch 1:  56%|█████▌    | 3807/6778 [41:41<32:30,  1.52it/s][A
Epoch 1:  56%|█████▌    | 3808/6778 [41:42<32:28,  1.52it/s][A
Epoch 1:  56%|█████▌    | 3809/6778 [41:42<32:30,  1.52it/s][A
Epoch 1:  56%|█████▌    | 3810/6778 [41:43<32:27,  1.52it/s][A
Epoch 1:  56%|█████▌    | 3811/6778 [41:44<32:23,  1.53it/s][A
Epoch 1:  56%|█████▌    | 3812/6778 [41:44<32:33,  1.52it/s][A
Epoch 1:  56%|█████▋    | 3813/6778 [41:45<32:39,  1.51it/s][A
Epoch 1:  56%|█████▋    | 3814/6778 [41:46<32:45,  1.51it/s][A
Epoch 1:  56%|█████▋    | 3815/6778 [41:46<32:39,  1.51it/s][A
Epoch 1:  56%|█████▋    | 3816/6778 [41:47<32:42,  1.51it/s][A
Epoch 1:  56%|█████▋    | 3817/6778 [41


Epoch: 0, Loss0.3064853791249043



Epoch 1:  57%|█████▋    | 3852/6778 [42:10<31:53,  1.53it/s][A
Epoch 1:  57%|█████▋    | 3853/6778 [42:11<31:55,  1.53it/s][A
Epoch 1:  57%|█████▋    | 3854/6778 [42:12<32:08,  1.52it/s][A
Epoch 1:  57%|█████▋    | 3855/6778 [42:12<32:07,  1.52it/s][A
Epoch 1:  57%|█████▋    | 3856/6778 [42:13<32:07,  1.52it/s][A
Epoch 1:  57%|█████▋    | 3857/6778 [42:14<32:13,  1.51it/s][A
Epoch 1:  57%|█████▋    | 3858/6778 [42:14<32:18,  1.51it/s][A
Epoch 1:  57%|█████▋    | 3859/6778 [42:15<32:00,  1.52it/s][A
Epoch 1:  57%|█████▋    | 3860/6778 [42:16<32:02,  1.52it/s][A
Epoch 1:  57%|█████▋    | 3861/6778 [42:16<31:54,  1.52it/s][A
Epoch 1:  57%|█████▋    | 3862/6778 [42:17<31:52,  1.52it/s][A
Epoch 1:  57%|█████▋    | 3863/6778 [42:18<31:48,  1.53it/s][A
Epoch 1:  57%|█████▋    | 3864/6778 [42:18<31:46,  1.53it/s][A
Epoch 1:  57%|█████▋    | 3865/6778 [42:19<31:47,  1.53it/s][A
Epoch 1:  57%|█████▋    | 3866/6778 [42:20<31:46,  1.53it/s][A
Epoch 1:  57%|█████▋    | 3867/6778 [42


Epoch: 0, Loss0.3066040541450509



Epoch 1:  58%|█████▊    | 3902/6778 [42:43<31:18,  1.53it/s][A
Epoch 1:  58%|█████▊    | 3903/6778 [42:44<31:14,  1.53it/s][A
Epoch 1:  58%|█████▊    | 3904/6778 [42:45<31:13,  1.53it/s][A
Epoch 1:  58%|█████▊    | 3905/6778 [42:45<31:16,  1.53it/s][A
Epoch 1:  58%|█████▊    | 3906/6778 [42:46<31:13,  1.53it/s][A
Epoch 1:  58%|█████▊    | 3907/6778 [42:47<31:24,  1.52it/s][A
Epoch 1:  58%|█████▊    | 3908/6778 [42:47<31:21,  1.53it/s][A
Epoch 1:  58%|█████▊    | 3909/6778 [42:48<31:15,  1.53it/s][A
Epoch 1:  58%|█████▊    | 3910/6778 [42:49<31:15,  1.53it/s][A
Epoch 1:  58%|█████▊    | 3911/6778 [42:49<31:15,  1.53it/s][A
Epoch 1:  58%|█████▊    | 3912/6778 [42:50<31:13,  1.53it/s][A
Epoch 1:  58%|█████▊    | 3913/6778 [42:51<31:11,  1.53it/s][A
Epoch 1:  58%|█████▊    | 3914/6778 [42:51<31:13,  1.53it/s][A
Epoch 1:  58%|█████▊    | 3915/6778 [42:52<31:21,  1.52it/s][A
Epoch 1:  58%|█████▊    | 3916/6778 [42:53<31:26,  1.52it/s][A
Epoch 1:  58%|█████▊    | 3917/6778 [42


Epoch: 0, Loss0.30641113331961467



Epoch 1:  58%|█████▊    | 3952/6778 [43:16<30:52,  1.53it/s][A
Epoch 1:  58%|█████▊    | 3953/6778 [43:17<30:57,  1.52it/s][A
Epoch 1:  58%|█████▊    | 3954/6778 [43:17<30:46,  1.53it/s][A
Epoch 1:  58%|█████▊    | 3955/6778 [43:18<30:49,  1.53it/s][A
Epoch 1:  58%|█████▊    | 3956/6778 [43:19<30:56,  1.52it/s][A
Epoch 1:  58%|█████▊    | 3957/6778 [43:19<31:08,  1.51it/s][A
Epoch 1:  58%|█████▊    | 3958/6778 [43:20<31:16,  1.50it/s][A
Epoch 1:  58%|█████▊    | 3959/6778 [43:21<31:06,  1.51it/s][A
Epoch 1:  58%|█████▊    | 3960/6778 [43:21<31:12,  1.51it/s][A
Epoch 1:  58%|█████▊    | 3961/6778 [43:22<31:03,  1.51it/s][A
Epoch 1:  58%|█████▊    | 3962/6778 [43:23<30:56,  1.52it/s][A
Epoch 1:  58%|█████▊    | 3963/6778 [43:23<30:52,  1.52it/s][A
Epoch 1:  58%|█████▊    | 3964/6778 [43:24<30:48,  1.52it/s][A
Epoch 1:  58%|█████▊    | 3965/6778 [43:25<30:46,  1.52it/s][A
Epoch 1:  59%|█████▊    | 3966/6778 [43:25<30:45,  1.52it/s][A
Epoch 1:  59%|█████▊    | 3967/6778 [43


Epoch: 0, Loss0.30629787085332505



Epoch 1:  59%|█████▉    | 4002/6778 [43:49<30:32,  1.51it/s][A
Epoch 1:  59%|█████▉    | 4003/6778 [43:50<30:34,  1.51it/s][A
Epoch 1:  59%|█████▉    | 4004/6778 [43:50<30:28,  1.52it/s][A
Epoch 1:  59%|█████▉    | 4005/6778 [43:51<30:26,  1.52it/s][A
Epoch 1:  59%|█████▉    | 4006/6778 [43:52<30:23,  1.52it/s][A
Epoch 1:  59%|█████▉    | 4007/6778 [43:52<30:23,  1.52it/s][A
Epoch 1:  59%|█████▉    | 4008/6778 [43:53<30:19,  1.52it/s][A
Epoch 1:  59%|█████▉    | 4009/6778 [43:54<30:21,  1.52it/s][A
Epoch 1:  59%|█████▉    | 4010/6778 [43:54<30:18,  1.52it/s][A
Epoch 1:  59%|█████▉    | 4011/6778 [43:55<30:16,  1.52it/s][A
Epoch 1:  59%|█████▉    | 4012/6778 [43:56<30:18,  1.52it/s][A
Epoch 1:  59%|█████▉    | 4013/6778 [43:56<30:06,  1.53it/s][A
Epoch 1:  59%|█████▉    | 4014/6778 [43:57<30:08,  1.53it/s][A
Epoch 1:  59%|█████▉    | 4015/6778 [43:58<30:15,  1.52it/s][A
Epoch 1:  59%|█████▉    | 4016/6778 [43:58<30:09,  1.53it/s][A
Epoch 1:  59%|█████▉    | 4017/6778 [43


Epoch: 0, Loss0.3061607462999792



Epoch 1:  60%|█████▉    | 4052/6778 [44:22<29:44,  1.53it/s][A
Epoch 1:  60%|█████▉    | 4053/6778 [44:23<29:37,  1.53it/s][A
Epoch 1:  60%|█████▉    | 4054/6778 [44:23<29:43,  1.53it/s][A
Epoch 1:  60%|█████▉    | 4055/6778 [44:24<29:41,  1.53it/s][A
Epoch 1:  60%|█████▉    | 4056/6778 [44:25<29:39,  1.53it/s][A
Epoch 1:  60%|█████▉    | 4057/6778 [44:25<29:39,  1.53it/s][A
Epoch 1:  60%|█████▉    | 4058/6778 [44:26<29:41,  1.53it/s][A
Epoch 1:  60%|█████▉    | 4059/6778 [44:26<29:55,  1.51it/s][A
Epoch 1:  60%|█████▉    | 4060/6778 [44:27<30:00,  1.51it/s][A
Epoch 1:  60%|█████▉    | 4061/6778 [44:28<30:02,  1.51it/s][A
Epoch 1:  60%|█████▉    | 4062/6778 [44:28<29:58,  1.51it/s][A
Epoch 1:  60%|█████▉    | 4063/6778 [44:29<29:59,  1.51it/s][A
Epoch 1:  60%|█████▉    | 4064/6778 [44:30<29:45,  1.52it/s][A
Epoch 1:  60%|█████▉    | 4065/6778 [44:30<29:35,  1.53it/s][A
Epoch 1:  60%|█████▉    | 4066/6778 [44:31<29:33,  1.53it/s][A
Epoch 1:  60%|██████    | 4067/6778 [44


Epoch: 0, Loss0.306161681300502



Epoch 1:  61%|██████    | 4102/6778 [44:55<29:31,  1.51it/s][A
Epoch 1:  61%|██████    | 4103/6778 [44:55<29:41,  1.50it/s][A
Epoch 1:  61%|██████    | 4104/6778 [44:56<29:39,  1.50it/s][A
Epoch 1:  61%|██████    | 4105/6778 [44:57<29:23,  1.52it/s][A
Epoch 1:  61%|██████    | 4106/6778 [44:57<29:14,  1.52it/s][A
Epoch 1:  61%|██████    | 4107/6778 [44:58<29:10,  1.53it/s][A
Epoch 1:  61%|██████    | 4108/6778 [44:59<29:11,  1.52it/s][A
Epoch 1:  61%|██████    | 4109/6778 [44:59<29:10,  1.52it/s][A
Epoch 1:  61%|██████    | 4110/6778 [45:00<29:07,  1.53it/s][A
Epoch 1:  61%|██████    | 4111/6778 [45:01<29:06,  1.53it/s][A
Epoch 1:  61%|██████    | 4112/6778 [45:01<29:05,  1.53it/s][A
Epoch 1:  61%|██████    | 4113/6778 [45:02<29:02,  1.53it/s][A
Epoch 1:  61%|██████    | 4114/6778 [45:03<29:01,  1.53it/s][A
Epoch 1:  61%|██████    | 4115/6778 [45:03<29:01,  1.53it/s][A
Epoch 1:  61%|██████    | 4116/6778 [45:04<28:58,  1.53it/s][A
Epoch 1:  61%|██████    | 4117/6778 [45


Epoch: 0, Loss0.3061775899624802



Epoch 1:  61%|██████▏   | 4152/6778 [45:28<28:42,  1.52it/s][A
Epoch 1:  61%|██████▏   | 4153/6778 [45:28<28:41,  1.52it/s][A
Epoch 1:  61%|██████▏   | 4154/6778 [45:29<28:41,  1.52it/s][A
Epoch 1:  61%|██████▏   | 4155/6778 [45:30<28:37,  1.53it/s][A
Epoch 1:  61%|██████▏   | 4156/6778 [45:30<28:39,  1.52it/s][A
Epoch 1:  61%|██████▏   | 4157/6778 [45:31<28:40,  1.52it/s][A
Epoch 1:  61%|██████▏   | 4158/6778 [45:32<28:41,  1.52it/s][A
Epoch 1:  61%|██████▏   | 4159/6778 [45:32<28:40,  1.52it/s][A
Epoch 1:  61%|██████▏   | 4160/6778 [45:33<28:41,  1.52it/s][A
Epoch 1:  61%|██████▏   | 4161/6778 [45:34<28:43,  1.52it/s][A
Epoch 1:  61%|██████▏   | 4162/6778 [45:34<28:44,  1.52it/s][A
Epoch 1:  61%|██████▏   | 4163/6778 [45:35<28:56,  1.51it/s][A
Epoch 1:  61%|██████▏   | 4164/6778 [45:36<28:52,  1.51it/s][A
Epoch 1:  61%|██████▏   | 4165/6778 [45:36<28:59,  1.50it/s][A
Epoch 1:  61%|██████▏   | 4166/6778 [45:37<29:02,  1.50it/s][A
Epoch 1:  61%|██████▏   | 4167/6778 [45


Epoch: 0, Loss0.3061161968831334



Epoch 1:  62%|██████▏   | 4202/6778 [46:00<28:06,  1.53it/s][A
Epoch 1:  62%|██████▏   | 4203/6778 [46:01<28:20,  1.51it/s][A
Epoch 1:  62%|██████▏   | 4204/6778 [46:02<28:33,  1.50it/s][A
Epoch 1:  62%|██████▏   | 4205/6778 [46:02<28:19,  1.51it/s][A
Epoch 1:  62%|██████▏   | 4206/6778 [46:03<28:27,  1.51it/s][A
Epoch 1:  62%|██████▏   | 4207/6778 [46:04<28:35,  1.50it/s][A
Epoch 1:  62%|██████▏   | 4208/6778 [46:04<28:14,  1.52it/s][A
Epoch 1:  62%|██████▏   | 4209/6778 [46:05<28:11,  1.52it/s][A
Epoch 1:  62%|██████▏   | 4210/6778 [46:06<28:07,  1.52it/s][A
Epoch 1:  62%|██████▏   | 4211/6778 [46:06<28:05,  1.52it/s][A
Epoch 1:  62%|██████▏   | 4212/6778 [46:07<28:00,  1.53it/s][A
Epoch 1:  62%|██████▏   | 4213/6778 [46:08<27:58,  1.53it/s][A
Epoch 1:  62%|██████▏   | 4214/6778 [46:08<28:00,  1.53it/s][A
Epoch 1:  62%|██████▏   | 4215/6778 [46:09<28:02,  1.52it/s][A
Epoch 1:  62%|██████▏   | 4216/6778 [46:10<28:01,  1.52it/s][A
Epoch 1:  62%|██████▏   | 4217/6778 [46


Epoch: 0, Loss0.30606163359023464



Epoch 1:  63%|██████▎   | 4252/6778 [46:33<27:39,  1.52it/s][A
Epoch 1:  63%|██████▎   | 4253/6778 [46:34<27:33,  1.53it/s][A
Epoch 1:  63%|██████▎   | 4254/6778 [46:35<27:32,  1.53it/s][A
Epoch 1:  63%|██████▎   | 4255/6778 [46:35<27:32,  1.53it/s][A
Epoch 1:  63%|██████▎   | 4256/6778 [46:36<27:31,  1.53it/s][A
Epoch 1:  63%|██████▎   | 4257/6778 [46:37<27:38,  1.52it/s][A
Epoch 1:  63%|██████▎   | 4258/6778 [46:37<27:36,  1.52it/s][A
Epoch 1:  63%|██████▎   | 4259/6778 [46:38<27:35,  1.52it/s][A
Epoch 1:  63%|██████▎   | 4260/6778 [46:39<27:34,  1.52it/s][A
Epoch 1:  63%|██████▎   | 4261/6778 [46:39<27:33,  1.52it/s][A
Epoch 1:  63%|██████▎   | 4262/6778 [46:40<27:32,  1.52it/s][A
Epoch 1:  63%|██████▎   | 4263/6778 [46:41<27:35,  1.52it/s][A
Epoch 1:  63%|██████▎   | 4264/6778 [46:41<27:46,  1.51it/s][A
Epoch 1:  63%|██████▎   | 4265/6778 [46:42<27:48,  1.51it/s][A
Epoch 1:  63%|██████▎   | 4266/6778 [46:43<27:56,  1.50it/s][A
Epoch 1:  63%|██████▎   | 4267/6778 [46


Epoch: 0, Loss0.3061144241837534



Epoch 1:  63%|██████▎   | 4302/6778 [47:06<27:03,  1.53it/s][A
Epoch 1:  63%|██████▎   | 4303/6778 [47:07<27:05,  1.52it/s][A
Epoch 1:  63%|██████▎   | 4304/6778 [47:08<27:01,  1.53it/s][A
Epoch 1:  64%|██████▎   | 4305/6778 [47:08<27:08,  1.52it/s][A
Epoch 1:  64%|██████▎   | 4306/6778 [47:09<27:05,  1.52it/s][A
Epoch 1:  64%|██████▎   | 4307/6778 [47:10<27:08,  1.52it/s][A
Epoch 1:  64%|██████▎   | 4308/6778 [47:10<27:08,  1.52it/s][A
Epoch 1:  64%|██████▎   | 4309/6778 [47:11<27:09,  1.52it/s][A
Epoch 1:  64%|██████▎   | 4310/6778 [47:12<27:19,  1.51it/s][A
Epoch 1:  64%|██████▎   | 4311/6778 [47:12<27:04,  1.52it/s][A
Epoch 1:  64%|██████▎   | 4312/6778 [47:13<27:00,  1.52it/s][A
Epoch 1:  64%|██████▎   | 4313/6778 [47:14<27:00,  1.52it/s][A
Epoch 1:  64%|██████▎   | 4314/6778 [47:14<26:57,  1.52it/s][A
Epoch 1:  64%|██████▎   | 4315/6778 [47:15<26:55,  1.53it/s][A
Epoch 1:  64%|██████▎   | 4316/6778 [47:16<26:50,  1.53it/s][A
Epoch 1:  64%|██████▎   | 4317/6778 [47


Epoch: 0, Loss0.3059360638973193



Epoch 1:  64%|██████▍   | 4352/6778 [47:39<26:43,  1.51it/s][A
Epoch 1:  64%|██████▍   | 4353/6778 [47:40<26:37,  1.52it/s][A
Epoch 1:  64%|██████▍   | 4354/6778 [47:41<26:36,  1.52it/s][A
Epoch 1:  64%|██████▍   | 4355/6778 [47:41<26:32,  1.52it/s][A
Epoch 1:  64%|██████▍   | 4356/6778 [47:42<26:31,  1.52it/s][A
Epoch 1:  64%|██████▍   | 4357/6778 [47:42<26:29,  1.52it/s][A
Epoch 1:  64%|██████▍   | 4358/6778 [47:43<26:34,  1.52it/s][A
Epoch 1:  64%|██████▍   | 4359/6778 [47:44<26:29,  1.52it/s][A
Epoch 1:  64%|██████▍   | 4360/6778 [47:44<26:25,  1.53it/s][A
Epoch 1:  64%|██████▍   | 4361/6778 [47:45<26:32,  1.52it/s][A
Epoch 1:  64%|██████▍   | 4362/6778 [47:46<26:23,  1.53it/s][A
Epoch 1:  64%|██████▍   | 4363/6778 [47:46<26:28,  1.52it/s][A
Epoch 1:  64%|██████▍   | 4364/6778 [47:47<26:23,  1.52it/s][A
Epoch 1:  64%|██████▍   | 4365/6778 [47:48<26:23,  1.52it/s][A
Epoch 1:  64%|██████▍   | 4366/6778 [47:48<26:21,  1.53it/s][A
Epoch 1:  64%|██████▍   | 4367/6778 [47


Epoch: 0, Loss0.3057729942832879



Epoch 1:  65%|██████▍   | 4402/6778 [48:12<25:59,  1.52it/s][A
Epoch 1:  65%|██████▍   | 4403/6778 [48:13<25:55,  1.53it/s][A
Epoch 1:  65%|██████▍   | 4404/6778 [48:13<25:51,  1.53it/s][A
Epoch 1:  65%|██████▍   | 4405/6778 [48:14<25:59,  1.52it/s][A
Epoch 1:  65%|██████▌   | 4406/6778 [48:15<25:48,  1.53it/s][A
Epoch 1:  65%|██████▌   | 4407/6778 [48:15<25:52,  1.53it/s][A
Epoch 1:  65%|██████▌   | 4408/6778 [48:16<26:01,  1.52it/s][A
Epoch 1:  65%|██████▌   | 4409/6778 [48:17<26:02,  1.52it/s][A
Epoch 1:  65%|██████▌   | 4410/6778 [48:17<26:07,  1.51it/s][A
Epoch 1:  65%|██████▌   | 4411/6778 [48:18<26:07,  1.51it/s][A
Epoch 1:  65%|██████▌   | 4412/6778 [48:19<26:08,  1.51it/s][A
Epoch 1:  65%|██████▌   | 4413/6778 [48:19<26:02,  1.51it/s][A
Epoch 1:  65%|██████▌   | 4414/6778 [48:20<25:57,  1.52it/s][A
Epoch 1:  65%|██████▌   | 4415/6778 [48:21<25:56,  1.52it/s][A
Epoch 1:  65%|██████▌   | 4416/6778 [48:21<26:00,  1.51it/s][A
Epoch 1:  65%|██████▌   | 4417/6778 [48


Epoch: 0, Loss0.3057901482368769



Epoch 1:  66%|██████▌   | 4452/6778 [48:45<25:34,  1.52it/s][A
Epoch 1:  66%|██████▌   | 4453/6778 [48:46<25:40,  1.51it/s][A
Epoch 1:  66%|██████▌   | 4454/6778 [48:46<25:39,  1.51it/s][A
Epoch 1:  66%|██████▌   | 4455/6778 [48:47<25:24,  1.52it/s][A
Epoch 1:  66%|██████▌   | 4456/6778 [48:48<25:21,  1.53it/s][A
Epoch 1:  66%|██████▌   | 4457/6778 [48:48<25:19,  1.53it/s][A
Epoch 1:  66%|██████▌   | 4458/6778 [48:49<25:18,  1.53it/s][A
Epoch 1:  66%|██████▌   | 4459/6778 [48:50<25:19,  1.53it/s][A
Epoch 1:  66%|██████▌   | 4460/6778 [48:50<25:18,  1.53it/s][A
Epoch 1:  66%|██████▌   | 4461/6778 [48:51<25:17,  1.53it/s][A
Epoch 1:  66%|██████▌   | 4462/6778 [48:51<25:21,  1.52it/s][A
Epoch 1:  66%|██████▌   | 4463/6778 [48:52<25:23,  1.52it/s][A
Epoch 1:  66%|██████▌   | 4464/6778 [48:53<25:21,  1.52it/s][A
Epoch 1:  66%|██████▌   | 4465/6778 [48:53<25:19,  1.52it/s][A
Epoch 1:  66%|██████▌   | 4466/6778 [48:54<25:19,  1.52it/s][A
Epoch 1:  66%|██████▌   | 4467/6778 [48


Epoch: 0, Loss0.30576411835970124



Epoch 1:  66%|██████▋   | 4502/6778 [49:18<24:54,  1.52it/s][A
Epoch 1:  66%|██████▋   | 4503/6778 [49:18<24:52,  1.52it/s][A
Epoch 1:  66%|██████▋   | 4504/6778 [49:19<24:53,  1.52it/s][A
Epoch 1:  66%|██████▋   | 4505/6778 [49:20<24:50,  1.52it/s][A
Epoch 1:  66%|██████▋   | 4506/6778 [49:20<24:52,  1.52it/s][A
Epoch 1:  66%|██████▋   | 4507/6778 [49:21<24:50,  1.52it/s][A
Epoch 1:  67%|██████▋   | 4508/6778 [49:22<24:50,  1.52it/s][A
Epoch 1:  67%|██████▋   | 4509/6778 [49:22<24:48,  1.52it/s][A
Epoch 1:  67%|██████▋   | 4510/6778 [49:23<24:46,  1.53it/s][A
Epoch 1:  67%|██████▋   | 4511/6778 [49:24<24:51,  1.52it/s][A
Epoch 1:  67%|██████▋   | 4512/6778 [49:24<24:57,  1.51it/s][A
Epoch 1:  67%|██████▋   | 4513/6778 [49:25<24:59,  1.51it/s][A
Epoch 1:  67%|██████▋   | 4514/6778 [49:26<24:52,  1.52it/s][A
Epoch 1:  67%|██████▋   | 4515/6778 [49:26<24:57,  1.51it/s][A
Epoch 1:  67%|██████▋   | 4516/6778 [49:27<25:01,  1.51it/s][A
Epoch 1:  67%|██████▋   | 4517/6778 [49


Epoch: 0, Loss0.30559645416519976



Epoch 1:  67%|██████▋   | 4552/6778 [49:51<24:13,  1.53it/s][A
Epoch 1:  67%|██████▋   | 4553/6778 [49:51<24:23,  1.52it/s][A
Epoch 1:  67%|██████▋   | 4554/6778 [49:52<24:30,  1.51it/s][A
Epoch 1:  67%|██████▋   | 4555/6778 [49:53<24:32,  1.51it/s][A
Epoch 1:  67%|██████▋   | 4556/6778 [49:53<24:37,  1.50it/s][A
Epoch 1:  67%|██████▋   | 4557/6778 [49:54<24:41,  1.50it/s][A
Epoch 1:  67%|██████▋   | 4558/6778 [49:55<24:32,  1.51it/s][A
Epoch 1:  67%|██████▋   | 4559/6778 [49:55<24:23,  1.52it/s][A
Epoch 1:  67%|██████▋   | 4560/6778 [49:56<24:17,  1.52it/s][A
Epoch 1:  67%|██████▋   | 4561/6778 [49:57<24:14,  1.52it/s][A
Epoch 1:  67%|██████▋   | 4562/6778 [49:57<24:13,  1.53it/s][A
Epoch 1:  67%|██████▋   | 4563/6778 [49:58<24:09,  1.53it/s][A
Epoch 1:  67%|██████▋   | 4564/6778 [49:59<24:12,  1.52it/s][A
Epoch 1:  67%|██████▋   | 4565/6778 [49:59<24:09,  1.53it/s][A
Epoch 1:  67%|██████▋   | 4566/6778 [50:00<24:07,  1.53it/s][A
Epoch 1:  67%|██████▋   | 4567/6778 [50


Epoch: 0, Loss0.3053632541014122



Epoch 1:  68%|██████▊   | 4602/6778 [50:24<23:46,  1.52it/s][A
Epoch 1:  68%|██████▊   | 4603/6778 [50:24<23:42,  1.53it/s][A
Epoch 1:  68%|██████▊   | 4604/6778 [50:25<23:40,  1.53it/s][A
Epoch 1:  68%|██████▊   | 4605/6778 [50:26<23:44,  1.53it/s][A
Epoch 1:  68%|██████▊   | 4606/6778 [50:26<23:39,  1.53it/s][A
Epoch 1:  68%|██████▊   | 4607/6778 [50:27<23:42,  1.53it/s][A
Epoch 1:  68%|██████▊   | 4608/6778 [50:27<23:39,  1.53it/s][A
Epoch 1:  68%|██████▊   | 4609/6778 [50:28<23:38,  1.53it/s][A
Epoch 1:  68%|██████▊   | 4610/6778 [50:29<23:40,  1.53it/s][A
Epoch 1:  68%|██████▊   | 4611/6778 [50:29<23:40,  1.53it/s][A
Epoch 1:  68%|██████▊   | 4612/6778 [50:30<23:35,  1.53it/s][A
Epoch 1:  68%|██████▊   | 4613/6778 [50:31<23:36,  1.53it/s][A
Epoch 1:  68%|██████▊   | 4614/6778 [50:31<23:40,  1.52it/s][A
Epoch 1:  68%|██████▊   | 4615/6778 [50:32<23:46,  1.52it/s][A
Epoch 1:  68%|██████▊   | 4616/6778 [50:33<23:48,  1.51it/s][A
Epoch 1:  68%|██████▊   | 4617/6778 [50


Epoch: 0, Loss0.3052433626728272



Epoch 1:  69%|██████▊   | 4652/6778 [50:56<23:08,  1.53it/s][A
Epoch 1:  69%|██████▊   | 4653/6778 [50:57<23:07,  1.53it/s][A
Epoch 1:  69%|██████▊   | 4654/6778 [50:58<23:10,  1.53it/s][A
Epoch 1:  69%|██████▊   | 4655/6778 [50:58<23:17,  1.52it/s][A
Epoch 1:  69%|██████▊   | 4656/6778 [50:59<23:15,  1.52it/s][A
Epoch 1:  69%|██████▊   | 4657/6778 [51:00<23:14,  1.52it/s][A
Epoch 1:  69%|██████▊   | 4658/6778 [51:00<23:12,  1.52it/s][A
Epoch 1:  69%|██████▊   | 4659/6778 [51:01<23:15,  1.52it/s][A
Epoch 1:  69%|██████▉   | 4660/6778 [51:02<23:22,  1.51it/s][A
Epoch 1:  69%|██████▉   | 4661/6778 [51:02<23:06,  1.53it/s][A
Epoch 1:  69%|██████▉   | 4662/6778 [51:03<23:04,  1.53it/s][A
Epoch 1:  69%|██████▉   | 4663/6778 [51:04<23:05,  1.53it/s][A
Epoch 1:  69%|██████▉   | 4664/6778 [51:04<23:04,  1.53it/s][A
Epoch 1:  69%|██████▉   | 4665/6778 [51:05<23:02,  1.53it/s][A
Epoch 1:  69%|██████▉   | 4666/6778 [51:06<23:02,  1.53it/s][A
Epoch 1:  69%|██████▉   | 4667/6778 [51


Epoch: 0, Loss0.305361694376777



Epoch 1:  69%|██████▉   | 4702/6778 [51:29<22:46,  1.52it/s][A
Epoch 1:  69%|██████▉   | 4703/6778 [51:30<22:42,  1.52it/s][A
Epoch 1:  69%|██████▉   | 4704/6778 [51:31<22:45,  1.52it/s][A
Epoch 1:  69%|██████▉   | 4705/6778 [51:31<22:38,  1.53it/s][A
Epoch 1:  69%|██████▉   | 4706/6778 [51:32<22:38,  1.53it/s][A
Epoch 1:  69%|██████▉   | 4707/6778 [51:33<22:39,  1.52it/s][A
Epoch 1:  69%|██████▉   | 4708/6778 [51:33<22:36,  1.53it/s][A
Epoch 1:  69%|██████▉   | 4709/6778 [51:34<22:38,  1.52it/s][A
Epoch 1:  69%|██████▉   | 4710/6778 [51:34<22:35,  1.53it/s][A
Epoch 1:  70%|██████▉   | 4711/6778 [51:35<22:36,  1.52it/s][A
Epoch 1:  70%|██████▉   | 4712/6778 [51:36<22:36,  1.52it/s][A
Epoch 1:  70%|██████▉   | 4713/6778 [51:36<22:32,  1.53it/s][A
Epoch 1:  70%|██████▉   | 4714/6778 [51:37<22:32,  1.53it/s][A
Epoch 1:  70%|██████▉   | 4715/6778 [51:38<22:31,  1.53it/s][A
Epoch 1:  70%|██████▉   | 4716/6778 [51:38<22:28,  1.53it/s][A
Epoch 1:  70%|██████▉   | 4717/6778 [51


Epoch: 0, Loss0.30534990114134203



Epoch 1:  70%|███████   | 4752/6778 [52:02<22:08,  1.52it/s][A
Epoch 1:  70%|███████   | 4753/6778 [52:03<22:13,  1.52it/s][A
Epoch 1:  70%|███████   | 4754/6778 [52:03<22:12,  1.52it/s][A
Epoch 1:  70%|███████   | 4755/6778 [52:04<22:09,  1.52it/s][A
Epoch 1:  70%|███████   | 4756/6778 [52:05<22:05,  1.53it/s][A
Epoch 1:  70%|███████   | 4757/6778 [52:05<22:06,  1.52it/s][A
Epoch 1:  70%|███████   | 4758/6778 [52:06<22:14,  1.51it/s][A
Epoch 1:  70%|███████   | 4759/6778 [52:07<22:10,  1.52it/s][A
Epoch 1:  70%|███████   | 4760/6778 [52:07<22:12,  1.51it/s][A
Epoch 1:  70%|███████   | 4761/6778 [52:08<22:11,  1.52it/s][A
Epoch 1:  70%|███████   | 4762/6778 [52:09<22:17,  1.51it/s][A
Epoch 1:  70%|███████   | 4763/6778 [52:09<22:16,  1.51it/s][A
Epoch 1:  70%|███████   | 4764/6778 [52:10<22:01,  1.52it/s][A
Epoch 1:  70%|███████   | 4765/6778 [52:11<22:01,  1.52it/s][A
Epoch 1:  70%|███████   | 4766/6778 [52:11<21:56,  1.53it/s][A
Epoch 1:  70%|███████   | 4767/6778 [52


Epoch: 0, Loss0.3053311755575381



Epoch 1:  71%|███████   | 4802/6778 [52:35<21:46,  1.51it/s][A
Epoch 1:  71%|███████   | 4803/6778 [52:36<21:51,  1.51it/s][A
Epoch 1:  71%|███████   | 4804/6778 [52:36<21:54,  1.50it/s][A
Epoch 1:  71%|███████   | 4805/6778 [52:37<21:38,  1.52it/s][A
Epoch 1:  71%|███████   | 4806/6778 [52:38<21:38,  1.52it/s][A
Epoch 1:  71%|███████   | 4807/6778 [52:38<21:32,  1.53it/s][A
Epoch 1:  71%|███████   | 4808/6778 [52:39<21:35,  1.52it/s][A
Epoch 1:  71%|███████   | 4809/6778 [52:40<21:31,  1.52it/s][A
Epoch 1:  71%|███████   | 4810/6778 [52:40<21:32,  1.52it/s][A
Epoch 1:  71%|███████   | 4811/6778 [52:41<21:28,  1.53it/s][A
Epoch 1:  71%|███████   | 4812/6778 [52:42<21:27,  1.53it/s][A
Epoch 1:  71%|███████   | 4813/6778 [52:42<21:25,  1.53it/s][A
Epoch 1:  71%|███████   | 4814/6778 [52:43<21:22,  1.53it/s][A
Epoch 1:  71%|███████   | 4815/6778 [52:44<21:21,  1.53it/s][A
Epoch 1:  71%|███████   | 4816/6778 [52:44<21:24,  1.53it/s][A
Epoch 1:  71%|███████   | 4817/6778 [52


Epoch: 0, Loss0.30517076181182173



Epoch 1:  72%|███████▏  | 4852/6778 [53:08<21:08,  1.52it/s][A
Epoch 1:  72%|███████▏  | 4853/6778 [53:09<21:08,  1.52it/s][A
Epoch 1:  72%|███████▏  | 4854/6778 [53:09<21:03,  1.52it/s][A
Epoch 1:  72%|███████▏  | 4855/6778 [53:10<21:01,  1.52it/s][A
Epoch 1:  72%|███████▏  | 4856/6778 [53:10<21:00,  1.53it/s][A
Epoch 1:  72%|███████▏  | 4857/6778 [53:11<20:59,  1.52it/s][A
Epoch 1:  72%|███████▏  | 4858/6778 [53:12<20:56,  1.53it/s][A
Epoch 1:  72%|███████▏  | 4859/6778 [53:12<20:56,  1.53it/s][A
Epoch 1:  72%|███████▏  | 4860/6778 [53:13<20:56,  1.53it/s][A
Epoch 1:  72%|███████▏  | 4861/6778 [53:14<21:11,  1.51it/s][A
Epoch 1:  72%|███████▏  | 4862/6778 [53:14<21:01,  1.52it/s][A
Epoch 1:  72%|███████▏  | 4863/6778 [53:15<21:00,  1.52it/s][A
Epoch 1:  72%|███████▏  | 4864/6778 [53:16<21:03,  1.52it/s][A
Epoch 1:  72%|███████▏  | 4865/6778 [53:16<21:06,  1.51it/s][A
Epoch 1:  72%|███████▏  | 4866/6778 [53:17<20:58,  1.52it/s][A
Epoch 1:  72%|███████▏  | 4867/6778 [53


Epoch: 0, Loss0.30514095518247764



Epoch 1:  72%|███████▏  | 4902/6778 [53:41<20:43,  1.51it/s][A
Epoch 1:  72%|███████▏  | 4903/6778 [53:41<20:41,  1.51it/s][A
Epoch 1:  72%|███████▏  | 4904/6778 [53:42<20:45,  1.51it/s][A
Epoch 1:  72%|███████▏  | 4905/6778 [53:43<20:47,  1.50it/s][A
Epoch 1:  72%|███████▏  | 4906/6778 [53:43<20:46,  1.50it/s][A
Epoch 1:  72%|███████▏  | 4907/6778 [53:44<20:42,  1.51it/s][A
Epoch 1:  72%|███████▏  | 4908/6778 [53:45<20:38,  1.51it/s][A
Epoch 1:  72%|███████▏  | 4909/6778 [53:45<20:33,  1.52it/s][A
Epoch 1:  72%|███████▏  | 4910/6778 [53:46<20:31,  1.52it/s][A
Epoch 1:  72%|███████▏  | 4911/6778 [53:47<20:29,  1.52it/s][A
Epoch 1:  72%|███████▏  | 4912/6778 [53:47<20:27,  1.52it/s][A
Epoch 1:  72%|███████▏  | 4913/6778 [53:48<20:33,  1.51it/s][A
Epoch 1:  72%|███████▏  | 4914/6778 [53:49<20:24,  1.52it/s][A
Epoch 1:  73%|███████▎  | 4915/6778 [53:49<20:21,  1.52it/s][A
Epoch 1:  73%|███████▎  | 4916/6778 [53:50<20:22,  1.52it/s][A
Epoch 1:  73%|███████▎  | 4917/6778 [53


Epoch: 0, Loss0.3049791969014307



Epoch 1:  73%|███████▎  | 4952/6778 [54:14<20:06,  1.51it/s][A
Epoch 1:  73%|███████▎  | 4953/6778 [54:14<20:01,  1.52it/s][A
Epoch 1:  73%|███████▎  | 4954/6778 [54:15<20:02,  1.52it/s][A
Epoch 1:  73%|███████▎  | 4955/6778 [54:16<19:58,  1.52it/s][A
Epoch 1:  73%|███████▎  | 4956/6778 [54:16<19:58,  1.52it/s][A
Epoch 1:  73%|███████▎  | 4957/6778 [54:17<19:59,  1.52it/s][A
Epoch 1:  73%|███████▎  | 4958/6778 [54:18<19:55,  1.52it/s][A
Epoch 1:  73%|███████▎  | 4959/6778 [54:18<19:54,  1.52it/s][A
Epoch 1:  73%|███████▎  | 4960/6778 [54:19<20:00,  1.51it/s][A
Epoch 1:  73%|███████▎  | 4961/6778 [54:20<19:56,  1.52it/s][A
Epoch 1:  73%|███████▎  | 4962/6778 [54:20<19:55,  1.52it/s][A
Epoch 1:  73%|███████▎  | 4963/6778 [54:21<19:52,  1.52it/s][A
Epoch 1:  73%|███████▎  | 4964/6778 [54:22<20:00,  1.51it/s][A
Epoch 1:  73%|███████▎  | 4965/6778 [54:22<20:03,  1.51it/s][A
Epoch 1:  73%|███████▎  | 4966/6778 [54:23<20:04,  1.50it/s][A
Epoch 1:  73%|███████▎  | 4967/6778 [54


Epoch: 0, Loss0.30480105029126686



Epoch 1:  74%|███████▍  | 5002/6778 [54:47<19:24,  1.53it/s][A
Epoch 1:  74%|███████▍  | 5003/6778 [54:47<19:24,  1.52it/s][A
Epoch 1:  74%|███████▍  | 5004/6778 [54:48<19:22,  1.53it/s][A
Epoch 1:  74%|███████▍  | 5005/6778 [54:49<19:30,  1.51it/s][A
Epoch 1:  74%|███████▍  | 5006/6778 [54:49<19:30,  1.51it/s][A
Epoch 1:  74%|███████▍  | 5007/6778 [54:50<19:44,  1.50it/s][A
Epoch 1:  74%|███████▍  | 5008/6778 [54:51<19:28,  1.51it/s][A
Epoch 1:  74%|███████▍  | 5009/6778 [54:51<19:31,  1.51it/s][A
Epoch 1:  74%|███████▍  | 5010/6778 [54:52<19:23,  1.52it/s][A
Epoch 1:  74%|███████▍  | 5011/6778 [54:53<19:22,  1.52it/s][A
Epoch 1:  74%|███████▍  | 5012/6778 [54:53<19:18,  1.52it/s][A
Epoch 1:  74%|███████▍  | 5013/6778 [54:54<19:21,  1.52it/s][A
Epoch 1:  74%|███████▍  | 5014/6778 [54:55<19:17,  1.52it/s][A
Epoch 1:  74%|███████▍  | 5015/6778 [54:55<19:19,  1.52it/s][A
Epoch 1:  74%|███████▍  | 5016/6778 [54:56<19:11,  1.53it/s][A
Epoch 1:  74%|███████▍  | 5017/6778 [54


Epoch: 0, Loss0.30472554611176744



Epoch 1:  75%|███████▍  | 5052/6778 [55:19<18:55,  1.52it/s][A
Epoch 1:  75%|███████▍  | 5053/6778 [55:20<18:53,  1.52it/s][A
Epoch 1:  75%|███████▍  | 5054/6778 [55:21<18:52,  1.52it/s][A
Epoch 1:  75%|███████▍  | 5055/6778 [55:21<18:50,  1.52it/s][A
Epoch 1:  75%|███████▍  | 5056/6778 [55:22<18:47,  1.53it/s][A
Epoch 1:  75%|███████▍  | 5057/6778 [55:23<18:46,  1.53it/s][A
Epoch 1:  75%|███████▍  | 5058/6778 [55:23<18:48,  1.52it/s][A
Epoch 1:  75%|███████▍  | 5059/6778 [55:24<18:46,  1.53it/s][A
Epoch 1:  75%|███████▍  | 5060/6778 [55:25<18:46,  1.53it/s][A
Epoch 1:  75%|███████▍  | 5061/6778 [55:25<18:44,  1.53it/s][A
Epoch 1:  75%|███████▍  | 5062/6778 [55:26<18:41,  1.53it/s][A
Epoch 1:  75%|███████▍  | 5063/6778 [55:27<18:40,  1.53it/s][A
Epoch 1:  75%|███████▍  | 5064/6778 [55:27<18:42,  1.53it/s][A
Epoch 1:  75%|███████▍  | 5065/6778 [55:28<18:43,  1.52it/s][A
Epoch 1:  75%|███████▍  | 5066/6778 [55:29<18:40,  1.53it/s][A
Epoch 1:  75%|███████▍  | 5067/6778 [55


Epoch: 0, Loss0.30473122299973626



Epoch 1:  75%|███████▌  | 5102/6778 [55:52<18:18,  1.53it/s][A
Epoch 1:  75%|███████▌  | 5103/6778 [55:53<18:14,  1.53it/s][A
Epoch 1:  75%|███████▌  | 5104/6778 [55:54<18:12,  1.53it/s][A
Epoch 1:  75%|███████▌  | 5105/6778 [55:54<18:13,  1.53it/s][A
Epoch 1:  75%|███████▌  | 5106/6778 [55:55<18:13,  1.53it/s][A
Epoch 1:  75%|███████▌  | 5107/6778 [55:56<18:13,  1.53it/s][A
Epoch 1:  75%|███████▌  | 5108/6778 [55:56<18:21,  1.52it/s][A
Epoch 1:  75%|███████▌  | 5109/6778 [55:57<18:22,  1.51it/s][A
Epoch 1:  75%|███████▌  | 5110/6778 [55:58<18:26,  1.51it/s][A
Epoch 1:  75%|███████▌  | 5111/6778 [55:58<18:27,  1.51it/s][A
Epoch 1:  75%|███████▌  | 5112/6778 [55:59<18:26,  1.51it/s][A
Epoch 1:  75%|███████▌  | 5113/6778 [56:00<18:25,  1.51it/s][A
Epoch 1:  75%|███████▌  | 5114/6778 [56:00<18:25,  1.51it/s][A
Epoch 1:  75%|███████▌  | 5115/6778 [56:01<18:14,  1.52it/s][A
Epoch 1:  75%|███████▌  | 5116/6778 [56:02<18:12,  1.52it/s][A
Epoch 1:  75%|███████▌  | 5117/6778 [56


Epoch: 0, Loss0.3047286822315768



Epoch 1:  76%|███████▌  | 5152/6778 [56:25<17:53,  1.51it/s][A
Epoch 1:  76%|███████▌  | 5153/6778 [56:26<17:53,  1.51it/s][A
Epoch 1:  76%|███████▌  | 5154/6778 [56:27<17:48,  1.52it/s][A
Epoch 1:  76%|███████▌  | 5155/6778 [56:27<17:47,  1.52it/s][A
Epoch 1:  76%|███████▌  | 5156/6778 [56:28<17:46,  1.52it/s][A
Epoch 1:  76%|███████▌  | 5157/6778 [56:28<17:45,  1.52it/s][A
Epoch 1:  76%|███████▌  | 5158/6778 [56:29<17:47,  1.52it/s][A
Epoch 1:  76%|███████▌  | 5159/6778 [56:30<17:40,  1.53it/s][A
Epoch 1:  76%|███████▌  | 5160/6778 [56:30<17:41,  1.52it/s][A
Epoch 1:  76%|███████▌  | 5161/6778 [56:31<17:40,  1.52it/s][A
Epoch 1:  76%|███████▌  | 5162/6778 [56:32<17:39,  1.52it/s][A
Epoch 1:  76%|███████▌  | 5163/6778 [56:32<17:40,  1.52it/s][A
Epoch 1:  76%|███████▌  | 5164/6778 [56:33<17:36,  1.53it/s][A
Epoch 1:  76%|███████▌  | 5165/6778 [56:34<17:35,  1.53it/s][A
Epoch 1:  76%|███████▌  | 5166/6778 [56:34<17:34,  1.53it/s][A
Epoch 1:  76%|███████▌  | 5167/6778 [56


Epoch: 0, Loss0.3044808001469314



Epoch 1:  77%|███████▋  | 5202/6778 [56:58<17:12,  1.53it/s][A
Epoch 1:  77%|███████▋  | 5203/6778 [56:59<17:10,  1.53it/s][A
Epoch 1:  77%|███████▋  | 5204/6778 [56:59<17:12,  1.52it/s][A
Epoch 1:  77%|███████▋  | 5205/6778 [57:00<17:09,  1.53it/s][A
Epoch 1:  77%|███████▋  | 5206/6778 [57:01<17:09,  1.53it/s][A
Epoch 1:  77%|███████▋  | 5207/6778 [57:01<17:08,  1.53it/s][A
Epoch 1:  77%|███████▋  | 5208/6778 [57:02<17:09,  1.53it/s][A
Epoch 1:  77%|███████▋  | 5209/6778 [57:03<17:08,  1.53it/s][A
Epoch 1:  77%|███████▋  | 5210/6778 [57:03<17:06,  1.53it/s][A
Epoch 1:  77%|███████▋  | 5211/6778 [57:04<17:13,  1.52it/s][A
Epoch 1:  77%|███████▋  | 5212/6778 [57:05<17:17,  1.51it/s][A
Epoch 1:  77%|███████▋  | 5213/6778 [57:05<17:30,  1.49it/s][A
Epoch 1:  77%|███████▋  | 5214/6778 [57:06<17:17,  1.51it/s][A
Epoch 1:  77%|███████▋  | 5215/6778 [57:07<17:20,  1.50it/s][A
Epoch 1:  77%|███████▋  | 5216/6778 [57:07<17:13,  1.51it/s][A
Epoch 1:  77%|███████▋  | 5217/6778 [57


Epoch: 0, Loss0.30441547518621237



Epoch 1:  77%|███████▋  | 5252/6778 [57:31<16:51,  1.51it/s][A
Epoch 1:  78%|███████▊  | 5253/6778 [57:32<16:48,  1.51it/s][A
Epoch 1:  78%|███████▊  | 5254/6778 [57:32<16:47,  1.51it/s][A
Epoch 1:  78%|███████▊  | 5255/6778 [57:33<16:47,  1.51it/s][A
Epoch 1:  78%|███████▊  | 5256/6778 [57:34<16:49,  1.51it/s][A
Epoch 1:  78%|███████▊  | 5257/6778 [57:34<16:42,  1.52it/s][A
Epoch 1:  78%|███████▊  | 5258/6778 [57:35<16:40,  1.52it/s][A
Epoch 1:  78%|███████▊  | 5259/6778 [57:36<16:40,  1.52it/s][A
Epoch 1:  78%|███████▊  | 5260/6778 [57:36<16:37,  1.52it/s][A
Epoch 1:  78%|███████▊  | 5261/6778 [57:37<16:35,  1.52it/s][A
Epoch 1:  78%|███████▊  | 5262/6778 [57:38<16:33,  1.53it/s][A
Epoch 1:  78%|███████▊  | 5263/6778 [57:38<16:32,  1.53it/s][A
Epoch 1:  78%|███████▊  | 5264/6778 [57:39<16:34,  1.52it/s][A
Epoch 1:  78%|███████▊  | 5265/6778 [57:40<16:31,  1.53it/s][A
Epoch 1:  78%|███████▊  | 5266/6778 [57:40<16:32,  1.52it/s][A
Epoch 1:  78%|███████▊  | 5267/6778 [57


Epoch: 0, Loss0.3042807687250337



Epoch 1:  78%|███████▊  | 5302/6778 [58:04<16:07,  1.52it/s][A
Epoch 1:  78%|███████▊  | 5303/6778 [58:05<16:06,  1.53it/s][A
Epoch 1:  78%|███████▊  | 5304/6778 [58:05<16:04,  1.53it/s][A
Epoch 1:  78%|███████▊  | 5305/6778 [58:06<16:04,  1.53it/s][A
Epoch 1:  78%|███████▊  | 5306/6778 [58:06<16:03,  1.53it/s][A
Epoch 1:  78%|███████▊  | 5307/6778 [58:07<16:00,  1.53it/s][A
Epoch 1:  78%|███████▊  | 5308/6778 [58:08<16:01,  1.53it/s][A
Epoch 1:  78%|███████▊  | 5309/6778 [58:08<15:59,  1.53it/s][A
Epoch 1:  78%|███████▊  | 5310/6778 [58:09<15:57,  1.53it/s][A
Epoch 1:  78%|███████▊  | 5311/6778 [58:10<15:59,  1.53it/s][A
Epoch 1:  78%|███████▊  | 5312/6778 [58:10<15:58,  1.53it/s][A
Epoch 1:  78%|███████▊  | 5313/6778 [58:11<15:56,  1.53it/s][A
Epoch 1:  78%|███████▊  | 5314/6778 [58:12<16:02,  1.52it/s][A
Epoch 1:  78%|███████▊  | 5315/6778 [58:12<16:02,  1.52it/s][A
Epoch 1:  78%|███████▊  | 5316/6778 [58:13<16:01,  1.52it/s][A
Epoch 1:  78%|███████▊  | 5317/6778 [58


Epoch: 0, Loss0.3042550498351296



Epoch 1:  79%|███████▉  | 5352/6778 [58:37<15:31,  1.53it/s][A
Epoch 1:  79%|███████▉  | 5353/6778 [58:37<15:30,  1.53it/s][A
Epoch 1:  79%|███████▉  | 5354/6778 [58:38<15:28,  1.53it/s][A
Epoch 1:  79%|███████▉  | 5355/6778 [58:39<15:38,  1.52it/s][A
Epoch 1:  79%|███████▉  | 5356/6778 [58:39<15:41,  1.51it/s][A
Epoch 1:  79%|███████▉  | 5357/6778 [58:40<15:40,  1.51it/s][A
Epoch 1:  79%|███████▉  | 5358/6778 [58:41<15:40,  1.51it/s][A
Epoch 1:  79%|███████▉  | 5359/6778 [58:41<15:42,  1.51it/s][A
Epoch 1:  79%|███████▉  | 5360/6778 [58:42<15:30,  1.52it/s][A
Epoch 1:  79%|███████▉  | 5361/6778 [58:43<15:29,  1.53it/s][A
Epoch 1:  79%|███████▉  | 5362/6778 [58:43<15:25,  1.53it/s][A
Epoch 1:  79%|███████▉  | 5363/6778 [58:44<15:25,  1.53it/s][A
Epoch 1:  79%|███████▉  | 5364/6778 [58:45<15:28,  1.52it/s][A
Epoch 1:  79%|███████▉  | 5365/6778 [58:45<15:24,  1.53it/s][A
Epoch 1:  79%|███████▉  | 5366/6778 [58:46<15:24,  1.53it/s][A
Epoch 1:  79%|███████▉  | 5367/6778 [58


Epoch: 0, Loss0.3042944898482959



Epoch 1:  80%|███████▉  | 5402/6778 [59:10<15:05,  1.52it/s][A
Epoch 1:  80%|███████▉  | 5403/6778 [59:10<15:02,  1.52it/s][A
Epoch 1:  80%|███████▉  | 5404/6778 [59:11<15:02,  1.52it/s][A
Epoch 1:  80%|███████▉  | 5405/6778 [59:12<14:59,  1.53it/s][A
Epoch 1:  80%|███████▉  | 5406/6778 [59:12<14:58,  1.53it/s][A
Epoch 1:  80%|███████▉  | 5407/6778 [59:13<14:57,  1.53it/s][A
Epoch 1:  80%|███████▉  | 5408/6778 [59:13<14:57,  1.53it/s][A
Epoch 1:  80%|███████▉  | 5409/6778 [59:14<14:57,  1.53it/s][A
Epoch 1:  80%|███████▉  | 5410/6778 [59:15<14:57,  1.53it/s][A
Epoch 1:  80%|███████▉  | 5411/6778 [59:15<14:55,  1.53it/s][A
Epoch 1:  80%|███████▉  | 5412/6778 [59:16<14:56,  1.52it/s][A
Epoch 1:  80%|███████▉  | 5413/6778 [59:17<14:53,  1.53it/s][A
Epoch 1:  80%|███████▉  | 5414/6778 [59:17<14:53,  1.53it/s][A
Epoch 1:  80%|███████▉  | 5415/6778 [59:18<14:52,  1.53it/s][A
Epoch 1:  80%|███████▉  | 5416/6778 [59:19<14:50,  1.53it/s][A
Epoch 1:  80%|███████▉  | 5417/6778 [59


Epoch: 0, Loss0.304234176506484



Epoch 1:  80%|████████  | 5452/6778 [59:42<14:26,  1.53it/s][A
Epoch 1:  80%|████████  | 5453/6778 [59:43<14:27,  1.53it/s][A
Epoch 1:  80%|████████  | 5454/6778 [59:44<14:27,  1.53it/s][A
Epoch 1:  80%|████████  | 5455/6778 [59:44<14:27,  1.53it/s][A
Epoch 1:  80%|████████  | 5456/6778 [59:45<14:25,  1.53it/s][A
Epoch 1:  81%|████████  | 5457/6778 [59:46<14:25,  1.53it/s][A
Epoch 1:  81%|████████  | 5458/6778 [59:46<14:28,  1.52it/s][A
Epoch 1:  81%|████████  | 5459/6778 [59:47<14:30,  1.52it/s][A
Epoch 1:  81%|████████  | 5460/6778 [59:48<14:31,  1.51it/s][A
Epoch 1:  81%|████████  | 5461/6778 [59:48<14:29,  1.51it/s][A
Epoch 1:  81%|████████  | 5462/6778 [59:49<14:31,  1.51it/s][A
Epoch 1:  81%|████████  | 5463/6778 [59:50<14:23,  1.52it/s][A
Epoch 1:  81%|████████  | 5464/6778 [59:50<14:21,  1.53it/s][A
Epoch 1:  81%|████████  | 5465/6778 [59:51<14:19,  1.53it/s][A
Epoch 1:  81%|████████  | 5466/6778 [59:52<14:20,  1.53it/s][A
Epoch 1:  81%|████████  | 5467/6778 [59


Epoch: 0, Loss0.30426739431867555



Epoch 1:  81%|████████  | 5502/6778 [1:00:15<14:02,  1.52it/s][A
Epoch 1:  81%|████████  | 5503/6778 [1:00:16<14:06,  1.51it/s][A
Epoch 1:  81%|████████  | 5504/6778 [1:00:16<13:58,  1.52it/s][A
Epoch 1:  81%|████████  | 5505/6778 [1:00:17<13:56,  1.52it/s][A
Epoch 1:  81%|████████  | 5506/6778 [1:00:18<13:55,  1.52it/s][A
Epoch 1:  81%|████████  | 5507/6778 [1:00:18<13:54,  1.52it/s][A
Epoch 1:  81%|████████▏ | 5508/6778 [1:00:19<13:52,  1.53it/s][A
Epoch 1:  81%|████████▏ | 5509/6778 [1:00:20<13:53,  1.52it/s][A
Epoch 1:  81%|████████▏ | 5510/6778 [1:00:20<13:52,  1.52it/s][A
Epoch 1:  81%|████████▏ | 5511/6778 [1:00:21<13:50,  1.53it/s][A
Epoch 1:  81%|████████▏ | 5512/6778 [1:00:22<13:48,  1.53it/s][A
Epoch 1:  81%|████████▏ | 5513/6778 [1:00:22<13:48,  1.53it/s][A
Epoch 1:  81%|████████▏ | 5514/6778 [1:00:23<13:49,  1.52it/s][A
Epoch 1:  81%|████████▏ | 5515/6778 [1:00:24<13:47,  1.53it/s][A
Epoch 1:  81%|████████▏ | 5516/6778 [1:00:24<13:49,  1.52it/s][A
Epoch 1: 


Epoch: 0, Loss0.30420391647193135



Epoch 1:  82%|████████▏ | 5552/6778 [1:00:48<13:21,  1.53it/s][A
Epoch 1:  82%|████████▏ | 5553/6778 [1:00:49<13:23,  1.52it/s][A
Epoch 1:  82%|████████▏ | 5554/6778 [1:00:49<13:20,  1.53it/s][A
Epoch 1:  82%|████████▏ | 5555/6778 [1:00:50<13:20,  1.53it/s][A
Epoch 1:  82%|████████▏ | 5556/6778 [1:00:51<13:19,  1.53it/s][A
Epoch 1:  82%|████████▏ | 5557/6778 [1:00:51<13:18,  1.53it/s][A
Epoch 1:  82%|████████▏ | 5558/6778 [1:00:52<13:18,  1.53it/s][A
Epoch 1:  82%|████████▏ | 5559/6778 [1:00:53<13:17,  1.53it/s][A
Epoch 1:  82%|████████▏ | 5560/6778 [1:00:53<13:20,  1.52it/s][A
Epoch 1:  82%|████████▏ | 5561/6778 [1:00:54<13:20,  1.52it/s][A
Epoch 1:  82%|████████▏ | 5562/6778 [1:00:55<13:19,  1.52it/s][A
Epoch 1:  82%|████████▏ | 5563/6778 [1:00:55<13:19,  1.52it/s][A
Epoch 1:  82%|████████▏ | 5564/6778 [1:00:56<13:24,  1.51it/s][A
Epoch 1:  82%|████████▏ | 5565/6778 [1:00:57<13:25,  1.51it/s][A
Epoch 1:  82%|████████▏ | 5566/6778 [1:00:57<13:15,  1.52it/s][A
Epoch 1: 


Epoch: 0, Loss0.30408610999876845



Epoch 1:  83%|████████▎ | 5602/6778 [1:01:21<12:58,  1.51it/s][A
Epoch 1:  83%|████████▎ | 5603/6778 [1:01:21<12:53,  1.52it/s][A
Epoch 1:  83%|████████▎ | 5604/6778 [1:01:22<12:54,  1.52it/s][A
Epoch 1:  83%|████████▎ | 5605/6778 [1:01:23<12:55,  1.51it/s][A
Epoch 1:  83%|████████▎ | 5606/6778 [1:01:23<12:57,  1.51it/s][A
Epoch 1:  83%|████████▎ | 5607/6778 [1:01:24<12:54,  1.51it/s][A
Epoch 1:  83%|████████▎ | 5608/6778 [1:01:25<12:50,  1.52it/s][A
Epoch 1:  83%|████████▎ | 5609/6778 [1:01:25<12:46,  1.52it/s][A
Epoch 1:  83%|████████▎ | 5610/6778 [1:01:26<12:46,  1.52it/s][A
Epoch 1:  83%|████████▎ | 5611/6778 [1:01:27<12:45,  1.52it/s][A
Epoch 1:  83%|████████▎ | 5612/6778 [1:01:27<12:45,  1.52it/s][A
Epoch 1:  83%|████████▎ | 5613/6778 [1:01:28<12:43,  1.53it/s][A
Epoch 1:  83%|████████▎ | 5614/6778 [1:01:29<12:43,  1.52it/s][A
Epoch 1:  83%|████████▎ | 5615/6778 [1:01:29<12:41,  1.53it/s][A
Epoch 1:  83%|████████▎ | 5616/6778 [1:01:30<12:41,  1.53it/s][A
Epoch 1: 


Epoch: 0, Loss0.30393675888767074



Epoch 1:  83%|████████▎ | 5652/6778 [1:01:54<12:17,  1.53it/s][A
Epoch 1:  83%|████████▎ | 5653/6778 [1:01:54<12:14,  1.53it/s][A
Epoch 1:  83%|████████▎ | 5654/6778 [1:01:55<12:14,  1.53it/s][A
Epoch 1:  83%|████████▎ | 5655/6778 [1:01:56<12:14,  1.53it/s][A
Epoch 1:  83%|████████▎ | 5656/6778 [1:01:56<12:13,  1.53it/s][A
Epoch 1:  83%|████████▎ | 5657/6778 [1:01:57<12:12,  1.53it/s][A
Epoch 1:  83%|████████▎ | 5658/6778 [1:01:58<12:12,  1.53it/s][A
Epoch 1:  83%|████████▎ | 5659/6778 [1:01:58<12:10,  1.53it/s][A
Epoch 1:  84%|████████▎ | 5660/6778 [1:01:59<12:08,  1.53it/s][A
Epoch 1:  84%|████████▎ | 5661/6778 [1:02:00<12:10,  1.53it/s][A
Epoch 1:  84%|████████▎ | 5662/6778 [1:02:00<12:10,  1.53it/s][A
Epoch 1:  84%|████████▎ | 5663/6778 [1:02:01<12:09,  1.53it/s][A
Epoch 1:  84%|████████▎ | 5664/6778 [1:02:02<12:16,  1.51it/s][A
Epoch 1:  84%|████████▎ | 5665/6778 [1:02:02<12:17,  1.51it/s][A
Epoch 1:  84%|████████▎ | 5666/6778 [1:02:03<12:18,  1.51it/s][A
Epoch 1: 


Epoch: 0, Loss0.30388928344089344



Epoch 1:  84%|████████▍ | 5702/6778 [1:02:26<11:43,  1.53it/s][A
Epoch 1:  84%|████████▍ | 5703/6778 [1:02:27<11:42,  1.53it/s][A
Epoch 1:  84%|████████▍ | 5704/6778 [1:02:28<11:42,  1.53it/s][A
Epoch 1:  84%|████████▍ | 5705/6778 [1:02:28<11:48,  1.51it/s][A
Epoch 1:  84%|████████▍ | 5706/6778 [1:02:29<11:45,  1.52it/s][A
Epoch 1:  84%|████████▍ | 5707/6778 [1:02:30<11:45,  1.52it/s][A
Epoch 1:  84%|████████▍ | 5708/6778 [1:02:30<11:48,  1.51it/s][A
Epoch 1:  84%|████████▍ | 5709/6778 [1:02:31<11:51,  1.50it/s][A
Epoch 1:  84%|████████▍ | 5710/6778 [1:02:32<11:45,  1.51it/s][A
Epoch 1:  84%|████████▍ | 5711/6778 [1:02:32<11:42,  1.52it/s][A
Epoch 1:  84%|████████▍ | 5712/6778 [1:02:33<11:41,  1.52it/s][A
Epoch 1:  84%|████████▍ | 5713/6778 [1:02:34<11:38,  1.52it/s][A
Epoch 1:  84%|████████▍ | 5714/6778 [1:02:34<11:37,  1.52it/s][A
Epoch 1:  84%|████████▍ | 5715/6778 [1:02:35<11:41,  1.52it/s][A
Epoch 1:  84%|████████▍ | 5716/6778 [1:02:36<11:37,  1.52it/s][A
Epoch 1: 


Epoch: 0, Loss0.30393617527653



Epoch 1:  85%|████████▍ | 5752/6778 [1:02:59<11:17,  1.51it/s][A
Epoch 1:  85%|████████▍ | 5753/6778 [1:03:00<11:15,  1.52it/s][A
Epoch 1:  85%|████████▍ | 5754/6778 [1:03:01<11:13,  1.52it/s][A
Epoch 1:  85%|████████▍ | 5755/6778 [1:03:01<11:12,  1.52it/s][A
Epoch 1:  85%|████████▍ | 5756/6778 [1:03:02<11:10,  1.53it/s][A
Epoch 1:  85%|████████▍ | 5757/6778 [1:03:03<11:09,  1.53it/s][A
Epoch 1:  85%|████████▍ | 5758/6778 [1:03:03<11:09,  1.52it/s][A
Epoch 1:  85%|████████▍ | 5759/6778 [1:03:04<11:10,  1.52it/s][A
Epoch 1:  85%|████████▍ | 5760/6778 [1:03:05<11:08,  1.52it/s][A
Epoch 1:  85%|████████▍ | 5761/6778 [1:03:05<11:10,  1.52it/s][A
Epoch 1:  85%|████████▌ | 5762/6778 [1:03:06<11:07,  1.52it/s][A
Epoch 1:  85%|████████▌ | 5763/6778 [1:03:07<11:05,  1.53it/s][A
Epoch 1:  85%|████████▌ | 5764/6778 [1:03:07<11:04,  1.53it/s][A
Epoch 1:  85%|████████▌ | 5765/6778 [1:03:08<11:04,  1.53it/s][A
Epoch 1:  85%|████████▌ | 5766/6778 [1:03:09<11:04,  1.52it/s][A
Epoch 1: 


Epoch: 0, Loss0.30383670676439883



Epoch 1:  86%|████████▌ | 5802/6778 [1:03:32<10:42,  1.52it/s][A
Epoch 1:  86%|████████▌ | 5803/6778 [1:03:33<10:40,  1.52it/s][A
Epoch 1:  86%|████████▌ | 5804/6778 [1:03:34<10:39,  1.52it/s][A
Epoch 1:  86%|████████▌ | 5805/6778 [1:03:34<10:38,  1.52it/s][A
Epoch 1:  86%|████████▌ | 5806/6778 [1:03:35<10:39,  1.52it/s][A
Epoch 1:  86%|████████▌ | 5807/6778 [1:03:36<10:39,  1.52it/s][A
Epoch 1:  86%|████████▌ | 5808/6778 [1:03:36<10:39,  1.52it/s][A
Epoch 1:  86%|████████▌ | 5809/6778 [1:03:37<10:38,  1.52it/s][A
Epoch 1:  86%|████████▌ | 5810/6778 [1:03:38<10:38,  1.52it/s][A
Epoch 1:  86%|████████▌ | 5811/6778 [1:03:38<10:42,  1.50it/s][A
Epoch 1:  86%|████████▌ | 5812/6778 [1:03:39<10:41,  1.50it/s][A
Epoch 1:  86%|████████▌ | 5813/6778 [1:03:40<10:34,  1.52it/s][A
Epoch 1:  86%|████████▌ | 5814/6778 [1:03:40<10:32,  1.52it/s][A
Epoch 1:  86%|████████▌ | 5815/6778 [1:03:41<10:31,  1.52it/s][A
Epoch 1:  86%|████████▌ | 5816/6778 [1:03:42<10:30,  1.53it/s][A
Epoch 1: 


Epoch: 0, Loss0.30383294171995434



Epoch 1:  86%|████████▋ | 5852/6778 [1:04:05<10:12,  1.51it/s][A
Epoch 1:  86%|████████▋ | 5853/6778 [1:04:06<10:12,  1.51it/s][A
Epoch 1:  86%|████████▋ | 5854/6778 [1:04:07<10:05,  1.53it/s][A
Epoch 1:  86%|████████▋ | 5855/6778 [1:04:07<10:03,  1.53it/s][A
Epoch 1:  86%|████████▋ | 5856/6778 [1:04:08<10:04,  1.53it/s][A
Epoch 1:  86%|████████▋ | 5857/6778 [1:04:08<10:01,  1.53it/s][A
Epoch 1:  86%|████████▋ | 5858/6778 [1:04:09<10:01,  1.53it/s][A
Epoch 1:  86%|████████▋ | 5859/6778 [1:04:10<10:03,  1.52it/s][A
Epoch 1:  86%|████████▋ | 5860/6778 [1:04:10<10:03,  1.52it/s][A
Epoch 1:  86%|████████▋ | 5861/6778 [1:04:11<10:04,  1.52it/s][A
Epoch 1:  86%|████████▋ | 5862/6778 [1:04:12<10:01,  1.52it/s][A
Epoch 1:  87%|████████▋ | 5863/6778 [1:04:12<10:00,  1.52it/s][A
Epoch 1:  87%|████████▋ | 5864/6778 [1:04:13<09:59,  1.52it/s][A
Epoch 1:  87%|████████▋ | 5865/6778 [1:04:14<09:57,  1.53it/s][A
Epoch 1:  87%|████████▋ | 5866/6778 [1:04:14<09:56,  1.53it/s][A
Epoch 1: 


Epoch: 0, Loss0.3039621399484172



Epoch 1:  87%|████████▋ | 5902/6778 [1:04:38<09:34,  1.53it/s][A
Epoch 1:  87%|████████▋ | 5903/6778 [1:04:39<09:34,  1.52it/s][A
Epoch 1:  87%|████████▋ | 5904/6778 [1:04:39<09:33,  1.52it/s][A
Epoch 1:  87%|████████▋ | 5905/6778 [1:04:40<09:32,  1.52it/s][A
Epoch 1:  87%|████████▋ | 5906/6778 [1:04:41<09:30,  1.53it/s][A
Epoch 1:  87%|████████▋ | 5907/6778 [1:04:41<09:29,  1.53it/s][A
Epoch 1:  87%|████████▋ | 5908/6778 [1:04:42<09:29,  1.53it/s][A
Epoch 1:  87%|████████▋ | 5909/6778 [1:04:43<09:28,  1.53it/s][A
Epoch 1:  87%|████████▋ | 5910/6778 [1:04:43<09:32,  1.52it/s][A
Epoch 1:  87%|████████▋ | 5911/6778 [1:04:44<09:31,  1.52it/s][A
Epoch 1:  87%|████████▋ | 5912/6778 [1:04:45<09:32,  1.51it/s][A
Epoch 1:  87%|████████▋ | 5913/6778 [1:04:45<09:30,  1.52it/s][A
Epoch 1:  87%|████████▋ | 5914/6778 [1:04:46<09:31,  1.51it/s][A
Epoch 1:  87%|████████▋ | 5915/6778 [1:04:47<09:26,  1.52it/s][A
Epoch 1:  87%|████████▋ | 5916/6778 [1:04:47<09:25,  1.52it/s][A
Epoch 1: 


Epoch: 0, Loss0.3039093221915087



Epoch 1:  88%|████████▊ | 5952/6778 [1:05:11<09:04,  1.52it/s][A
Epoch 1:  88%|████████▊ | 5953/6778 [1:05:12<09:02,  1.52it/s][A
Epoch 1:  88%|████████▊ | 5954/6778 [1:05:12<09:02,  1.52it/s][A
Epoch 1:  88%|████████▊ | 5955/6778 [1:05:13<09:02,  1.52it/s][A
Epoch 1:  88%|████████▊ | 5956/6778 [1:05:14<09:04,  1.51it/s][A
Epoch 1:  88%|████████▊ | 5957/6778 [1:05:14<08:56,  1.53it/s][A
Epoch 1:  88%|████████▊ | 5958/6778 [1:05:15<08:56,  1.53it/s][A
Epoch 1:  88%|████████▊ | 5959/6778 [1:05:16<08:55,  1.53it/s][A
Epoch 1:  88%|████████▊ | 5960/6778 [1:05:16<08:54,  1.53it/s][A
Epoch 1:  88%|████████▊ | 5961/6778 [1:05:17<08:54,  1.53it/s][A
Epoch 1:  88%|████████▊ | 5962/6778 [1:05:17<08:53,  1.53it/s][A
Epoch 1:  88%|████████▊ | 5963/6778 [1:05:18<08:52,  1.53it/s][A
Epoch 1:  88%|████████▊ | 5964/6778 [1:05:19<08:52,  1.53it/s][A
Epoch 1:  88%|████████▊ | 5965/6778 [1:05:19<08:50,  1.53it/s][A
Epoch 1:  88%|████████▊ | 5966/6778 [1:05:20<08:50,  1.53it/s][A
Epoch 1: 


Epoch: 0, Loss0.3038797614100555



Epoch 1:  89%|████████▊ | 6002/6778 [1:05:44<08:29,  1.52it/s][A
Epoch 1:  89%|████████▊ | 6003/6778 [1:05:44<08:28,  1.53it/s][A
Epoch 1:  89%|████████▊ | 6004/6778 [1:05:45<08:27,  1.53it/s][A
Epoch 1:  89%|████████▊ | 6005/6778 [1:05:46<08:26,  1.53it/s][A
Epoch 1:  89%|████████▊ | 6006/6778 [1:05:46<08:25,  1.53it/s][A
Epoch 1:  89%|████████▊ | 6007/6778 [1:05:47<08:26,  1.52it/s][A
Epoch 1:  89%|████████▊ | 6008/6778 [1:05:48<08:24,  1.53it/s][A
Epoch 1:  89%|████████▊ | 6009/6778 [1:05:48<08:24,  1.52it/s][A
Epoch 1:  89%|████████▊ | 6010/6778 [1:05:49<08:24,  1.52it/s][A
Epoch 1:  89%|████████▊ | 6011/6778 [1:05:50<08:23,  1.52it/s][A
Epoch 1:  89%|████████▊ | 6012/6778 [1:05:50<08:23,  1.52it/s][A
Epoch 1:  89%|████████▊ | 6013/6778 [1:05:51<08:25,  1.51it/s][A
Epoch 1:  89%|████████▊ | 6014/6778 [1:05:52<08:22,  1.52it/s][A
Epoch 1:  89%|████████▊ | 6015/6778 [1:05:52<08:22,  1.52it/s][A
Epoch 1:  89%|████████▉ | 6016/6778 [1:05:53<08:24,  1.51it/s][A
Epoch 1: 


Epoch: 0, Loss0.30395887635612545



Epoch 1:  89%|████████▉ | 6052/6778 [1:06:17<07:55,  1.53it/s][A
Epoch 1:  89%|████████▉ | 6053/6778 [1:06:17<07:54,  1.53it/s][A
Epoch 1:  89%|████████▉ | 6054/6778 [1:06:18<07:53,  1.53it/s][A
Epoch 1:  89%|████████▉ | 6055/6778 [1:06:19<07:55,  1.52it/s][A
Epoch 1:  89%|████████▉ | 6056/6778 [1:06:19<07:59,  1.50it/s][A
Epoch 1:  89%|████████▉ | 6057/6778 [1:06:20<07:56,  1.51it/s][A
Epoch 1:  89%|████████▉ | 6058/6778 [1:06:21<07:56,  1.51it/s][A
Epoch 1:  89%|████████▉ | 6059/6778 [1:06:21<07:56,  1.51it/s][A
Epoch 1:  89%|████████▉ | 6060/6778 [1:06:22<07:49,  1.53it/s][A
Epoch 1:  89%|████████▉ | 6061/6778 [1:06:23<07:49,  1.53it/s][A
Epoch 1:  89%|████████▉ | 6062/6778 [1:06:23<07:48,  1.53it/s][A
Epoch 1:  89%|████████▉ | 6063/6778 [1:06:24<07:48,  1.53it/s][A
Epoch 1:  89%|████████▉ | 6064/6778 [1:06:25<07:47,  1.53it/s][A
Epoch 1:  89%|████████▉ | 6065/6778 [1:06:25<07:47,  1.52it/s][A
Epoch 1:  89%|████████▉ | 6066/6778 [1:06:26<07:46,  1.53it/s][A
Epoch 1: 


Epoch: 0, Loss0.30392872393888404



Epoch 1:  90%|█████████ | 6102/6778 [1:06:50<07:24,  1.52it/s][A
Epoch 1:  90%|█████████ | 6103/6778 [1:06:50<07:22,  1.53it/s][A
Epoch 1:  90%|█████████ | 6104/6778 [1:06:51<07:22,  1.52it/s][A
Epoch 1:  90%|█████████ | 6105/6778 [1:06:51<07:22,  1.52it/s][A
Epoch 1:  90%|█████████ | 6106/6778 [1:06:52<07:21,  1.52it/s][A
Epoch 1:  90%|█████████ | 6107/6778 [1:06:53<07:20,  1.52it/s][A
Epoch 1:  90%|█████████ | 6108/6778 [1:06:53<07:19,  1.53it/s][A
Epoch 1:  90%|█████████ | 6109/6778 [1:06:54<07:19,  1.52it/s][A
Epoch 1:  90%|█████████ | 6110/6778 [1:06:55<07:17,  1.53it/s][A
Epoch 1:  90%|█████████ | 6111/6778 [1:06:55<07:16,  1.53it/s][A
Epoch 1:  90%|█████████ | 6112/6778 [1:06:56<07:15,  1.53it/s][A
Epoch 1:  90%|█████████ | 6113/6778 [1:06:57<07:15,  1.53it/s][A
Epoch 1:  90%|█████████ | 6114/6778 [1:06:57<07:15,  1.53it/s][A
Epoch 1:  90%|█████████ | 6115/6778 [1:06:58<07:13,  1.53it/s][A
Epoch 1:  90%|█████████ | 6116/6778 [1:06:59<07:15,  1.52it/s][A
Epoch 1: 


Epoch: 0, Loss0.3038860869417829



Epoch 1:  91%|█████████ | 6152/6778 [1:07:22<06:51,  1.52it/s][A
Epoch 1:  91%|█████████ | 6153/6778 [1:07:23<06:49,  1.53it/s][A
Epoch 1:  91%|█████████ | 6154/6778 [1:07:24<06:48,  1.53it/s][A
Epoch 1:  91%|█████████ | 6155/6778 [1:07:24<06:47,  1.53it/s][A
Epoch 1:  91%|█████████ | 6156/6778 [1:07:25<06:47,  1.53it/s][A
Epoch 1:  91%|█████████ | 6157/6778 [1:07:26<06:47,  1.52it/s][A
Epoch 1:  91%|█████████ | 6158/6778 [1:07:26<06:49,  1.51it/s][A
Epoch 1:  91%|█████████ | 6159/6778 [1:07:27<06:48,  1.52it/s][A
Epoch 1:  91%|█████████ | 6160/6778 [1:07:28<06:48,  1.51it/s][A
Epoch 1:  91%|█████████ | 6161/6778 [1:07:28<06:49,  1.50it/s][A
Epoch 1:  91%|█████████ | 6162/6778 [1:07:29<06:49,  1.51it/s][A
Epoch 1:  91%|█████████ | 6163/6778 [1:07:30<06:44,  1.52it/s][A
Epoch 1:  91%|█████████ | 6164/6778 [1:07:30<06:43,  1.52it/s][A
Epoch 1:  91%|█████████ | 6165/6778 [1:07:31<06:42,  1.52it/s][A
Epoch 1:  91%|█████████ | 6166/6778 [1:07:32<06:40,  1.53it/s][A
Epoch 1: 


Epoch: 0, Loss0.30367639910389466



Epoch 1:  92%|█████████▏| 6202/6778 [1:07:55<06:22,  1.50it/s][A
Epoch 1:  92%|█████████▏| 6203/6778 [1:07:56<06:20,  1.51it/s][A
Epoch 1:  92%|█████████▏| 6204/6778 [1:07:57<06:16,  1.52it/s][A
Epoch 1:  92%|█████████▏| 6205/6778 [1:07:57<06:16,  1.52it/s][A
Epoch 1:  92%|█████████▏| 6206/6778 [1:07:58<06:15,  1.52it/s][A
Epoch 1:  92%|█████████▏| 6207/6778 [1:07:58<06:14,  1.53it/s][A
Epoch 1:  92%|█████████▏| 6208/6778 [1:07:59<06:13,  1.53it/s][A
Epoch 1:  92%|█████████▏| 6209/6778 [1:08:00<06:13,  1.52it/s][A
Epoch 1:  92%|█████████▏| 6210/6778 [1:08:00<06:13,  1.52it/s][A
Epoch 1:  92%|█████████▏| 6211/6778 [1:08:01<06:11,  1.52it/s][A
Epoch 1:  92%|█████████▏| 6212/6778 [1:08:02<06:11,  1.52it/s][A
Epoch 1:  92%|█████████▏| 6213/6778 [1:08:02<06:10,  1.52it/s][A
Epoch 1:  92%|█████████▏| 6214/6778 [1:08:03<06:10,  1.52it/s][A
Epoch 1:  92%|█████████▏| 6215/6778 [1:08:04<06:09,  1.52it/s][A
Epoch 1:  92%|█████████▏| 6216/6778 [1:08:04<06:08,  1.52it/s][A
Epoch 1: 


Epoch: 0, Loss0.3035751473312949



Epoch 1:  92%|█████████▏| 6252/6778 [1:08:28<05:45,  1.52it/s][A
Epoch 1:  92%|█████████▏| 6253/6778 [1:08:29<05:43,  1.53it/s][A
Epoch 1:  92%|█████████▏| 6254/6778 [1:08:29<05:44,  1.52it/s][A
Epoch 1:  92%|█████████▏| 6255/6778 [1:08:30<05:41,  1.53it/s][A
Epoch 1:  92%|█████████▏| 6256/6778 [1:08:31<05:41,  1.53it/s][A
Epoch 1:  92%|█████████▏| 6257/6778 [1:08:31<05:40,  1.53it/s][A
Epoch 1:  92%|█████████▏| 6258/6778 [1:08:32<05:40,  1.53it/s][A
Epoch 1:  92%|█████████▏| 6259/6778 [1:08:33<05:39,  1.53it/s][A
Epoch 1:  92%|█████████▏| 6260/6778 [1:08:33<05:38,  1.53it/s][A
Epoch 1:  92%|█████████▏| 6261/6778 [1:08:34<05:40,  1.52it/s][A
Epoch 1:  92%|█████████▏| 6262/6778 [1:08:35<05:40,  1.52it/s][A
Epoch 1:  92%|█████████▏| 6263/6778 [1:08:35<05:40,  1.51it/s][A
Epoch 1:  92%|█████████▏| 6264/6778 [1:08:36<05:40,  1.51it/s][A
Epoch 1:  92%|█████████▏| 6265/6778 [1:08:37<05:40,  1.50it/s][A
Epoch 1:  92%|█████████▏| 6266/6778 [1:08:37<05:36,  1.52it/s][A
Epoch 1: 


Epoch: 0, Loss0.30353992839589644



Epoch 1:  93%|█████████▎| 6302/6778 [1:09:01<05:12,  1.52it/s][A
Epoch 1:  93%|█████████▎| 6303/6778 [1:09:02<05:12,  1.52it/s][A
Epoch 1:  93%|█████████▎| 6304/6778 [1:09:02<05:13,  1.51it/s][A
Epoch 1:  93%|█████████▎| 6305/6778 [1:09:03<05:14,  1.50it/s][A
Epoch 1:  93%|█████████▎| 6306/6778 [1:09:04<05:14,  1.50it/s][A
Epoch 1:  93%|█████████▎| 6307/6778 [1:09:04<05:09,  1.52it/s][A
Epoch 1:  93%|█████████▎| 6308/6778 [1:09:05<05:08,  1.52it/s][A
Epoch 1:  93%|█████████▎| 6309/6778 [1:09:05<05:07,  1.52it/s][A
Epoch 1:  93%|█████████▎| 6310/6778 [1:09:06<05:07,  1.52it/s][A
Epoch 1:  93%|█████████▎| 6311/6778 [1:09:07<05:06,  1.53it/s][A
Epoch 1:  93%|█████████▎| 6312/6778 [1:09:07<05:05,  1.53it/s][A
Epoch 1:  93%|█████████▎| 6313/6778 [1:09:08<05:05,  1.52it/s][A
Epoch 1:  93%|█████████▎| 6314/6778 [1:09:09<05:04,  1.52it/s][A
Epoch 1:  93%|█████████▎| 6315/6778 [1:09:09<05:03,  1.52it/s][A
Epoch 1:  93%|█████████▎| 6316/6778 [1:09:10<05:03,  1.52it/s][A
Epoch 1: 


Epoch: 0, Loss0.3035081686093345



Epoch 1:  94%|█████████▎| 6352/6778 [1:09:34<04:40,  1.52it/s][A
Epoch 1:  94%|█████████▎| 6353/6778 [1:09:34<04:39,  1.52it/s][A
Epoch 1:  94%|█████████▎| 6354/6778 [1:09:35<04:38,  1.52it/s][A
Epoch 1:  94%|█████████▍| 6355/6778 [1:09:36<04:39,  1.51it/s][A
Epoch 1:  94%|█████████▍| 6356/6778 [1:09:36<04:37,  1.52it/s][A
Epoch 1:  94%|█████████▍| 6357/6778 [1:09:37<04:37,  1.52it/s][A
Epoch 1:  94%|█████████▍| 6358/6778 [1:09:38<04:35,  1.52it/s][A
Epoch 1:  94%|█████████▍| 6359/6778 [1:09:38<04:34,  1.53it/s][A
Epoch 1:  94%|█████████▍| 6360/6778 [1:09:39<04:33,  1.53it/s][A
Epoch 1:  94%|█████████▍| 6361/6778 [1:09:40<04:33,  1.53it/s][A
Epoch 1:  94%|█████████▍| 6362/6778 [1:09:40<04:32,  1.53it/s][A
Epoch 1:  94%|█████████▍| 6363/6778 [1:09:41<04:33,  1.52it/s][A
Epoch 1:  94%|█████████▍| 6364/6778 [1:09:42<04:35,  1.50it/s][A
Epoch 1:  94%|█████████▍| 6365/6778 [1:09:42<04:31,  1.52it/s][A
Epoch 1:  94%|█████████▍| 6366/6778 [1:09:43<04:32,  1.51it/s][A
Epoch 1: 


Epoch: 0, Loss0.30347706844840755



Epoch 1:  94%|█████████▍| 6402/6778 [1:10:07<04:06,  1.53it/s][A
Epoch 1:  94%|█████████▍| 6403/6778 [1:10:07<04:05,  1.53it/s][A
Epoch 1:  94%|█████████▍| 6404/6778 [1:10:08<04:06,  1.52it/s][A
Epoch 1:  94%|█████████▍| 6405/6778 [1:10:09<04:06,  1.51it/s][A
Epoch 1:  95%|█████████▍| 6406/6778 [1:10:09<04:05,  1.52it/s][A
Epoch 1:  95%|█████████▍| 6407/6778 [1:10:10<04:04,  1.52it/s][A
Epoch 1:  95%|█████████▍| 6408/6778 [1:10:11<04:05,  1.51it/s][A
Epoch 1:  95%|█████████▍| 6409/6778 [1:10:11<04:04,  1.51it/s][A
Epoch 1:  95%|█████████▍| 6410/6778 [1:10:12<04:01,  1.52it/s][A
Epoch 1:  95%|█████████▍| 6411/6778 [1:10:13<04:01,  1.52it/s][A
Epoch 1:  95%|█████████▍| 6412/6778 [1:10:13<04:00,  1.52it/s][A
Epoch 1:  95%|█████████▍| 6413/6778 [1:10:14<03:59,  1.53it/s][A
Epoch 1:  95%|█████████▍| 6414/6778 [1:10:15<03:58,  1.53it/s][A
Epoch 1:  95%|█████████▍| 6415/6778 [1:10:15<03:57,  1.53it/s][A
Epoch 1:  95%|█████████▍| 6416/6778 [1:10:16<03:57,  1.53it/s][A
Epoch 1: 


Epoch: 0, Loss0.3034328001021064



Epoch 1:  95%|█████████▌| 6452/6778 [1:10:39<03:33,  1.52it/s][A
Epoch 1:  95%|█████████▌| 6453/6778 [1:10:40<03:33,  1.52it/s][A
Epoch 1:  95%|█████████▌| 6454/6778 [1:10:41<03:32,  1.52it/s][A
Epoch 1:  95%|█████████▌| 6455/6778 [1:10:41<03:32,  1.52it/s][A
Epoch 1:  95%|█████████▌| 6456/6778 [1:10:42<03:32,  1.52it/s][A
Epoch 1:  95%|█████████▌| 6457/6778 [1:10:43<03:31,  1.52it/s][A
Epoch 1:  95%|█████████▌| 6458/6778 [1:10:43<03:30,  1.52it/s][A
Epoch 1:  95%|█████████▌| 6459/6778 [1:10:44<03:29,  1.52it/s][A
Epoch 1:  95%|█████████▌| 6460/6778 [1:10:45<03:28,  1.53it/s][A
Epoch 1:  95%|█████████▌| 6461/6778 [1:10:45<03:27,  1.53it/s][A
Epoch 1:  95%|█████████▌| 6462/6778 [1:10:46<03:27,  1.53it/s][A
Epoch 1:  95%|█████████▌| 6463/6778 [1:10:47<03:26,  1.53it/s][A
Epoch 1:  95%|█████████▌| 6464/6778 [1:10:47<03:25,  1.52it/s][A
Epoch 1:  95%|█████████▌| 6465/6778 [1:10:48<03:25,  1.52it/s][A
Epoch 1:  95%|█████████▌| 6466/6778 [1:10:49<03:25,  1.52it/s][A
Epoch 1: 


Epoch: 0, Loss0.30342472222236977



Epoch 1:  96%|█████████▌| 6502/6778 [1:11:12<03:01,  1.52it/s][A
Epoch 1:  96%|█████████▌| 6503/6778 [1:11:13<03:00,  1.52it/s][A
Epoch 1:  96%|█████████▌| 6504/6778 [1:11:14<03:00,  1.52it/s][A
Epoch 1:  96%|█████████▌| 6505/6778 [1:11:14<02:59,  1.52it/s][A
Epoch 1:  96%|█████████▌| 6506/6778 [1:11:15<02:58,  1.52it/s][A
Epoch 1:  96%|█████████▌| 6507/6778 [1:11:16<02:58,  1.51it/s][A
Epoch 1:  96%|█████████▌| 6508/6778 [1:11:16<02:58,  1.52it/s][A
Epoch 1:  96%|█████████▌| 6509/6778 [1:11:17<02:57,  1.52it/s][A
Epoch 1:  96%|█████████▌| 6510/6778 [1:11:18<02:57,  1.51it/s][A
Epoch 1:  96%|█████████▌| 6511/6778 [1:11:18<02:57,  1.50it/s][A
Epoch 1:  96%|█████████▌| 6512/6778 [1:11:19<02:57,  1.50it/s][A
Epoch 1:  96%|█████████▌| 6513/6778 [1:11:20<02:53,  1.53it/s][A
Epoch 1:  96%|█████████▌| 6514/6778 [1:11:20<02:52,  1.53it/s][A
Epoch 1:  96%|█████████▌| 6515/6778 [1:11:21<02:52,  1.52it/s][A
Epoch 1:  96%|█████████▌| 6516/6778 [1:11:22<02:51,  1.52it/s][A
Epoch 1: 


Epoch: 0, Loss0.3033562253081895



Epoch 1:  97%|█████████▋| 6552/6778 [1:11:45<02:30,  1.50it/s][A
Epoch 1:  97%|█████████▋| 6553/6778 [1:11:46<02:29,  1.50it/s][A
Epoch 1:  97%|█████████▋| 6554/6778 [1:11:47<02:27,  1.52it/s][A
Epoch 1:  97%|█████████▋| 6555/6778 [1:11:47<02:26,  1.52it/s][A
Epoch 1:  97%|█████████▋| 6556/6778 [1:11:48<02:25,  1.52it/s][A
Epoch 1:  97%|█████████▋| 6557/6778 [1:11:49<02:25,  1.52it/s][A
Epoch 1:  97%|█████████▋| 6558/6778 [1:11:49<02:24,  1.52it/s][A
Epoch 1:  97%|█████████▋| 6559/6778 [1:11:50<02:23,  1.52it/s][A
Epoch 1:  97%|█████████▋| 6560/6778 [1:11:50<02:23,  1.52it/s][A
Epoch 1:  97%|█████████▋| 6561/6778 [1:11:51<02:23,  1.52it/s][A
Epoch 1:  97%|█████████▋| 6562/6778 [1:11:52<02:22,  1.52it/s][A
Epoch 1:  97%|█████████▋| 6563/6778 [1:11:52<02:21,  1.52it/s][A
Epoch 1:  97%|█████████▋| 6564/6778 [1:11:53<02:20,  1.52it/s][A
Epoch 1:  97%|█████████▋| 6565/6778 [1:11:54<02:19,  1.53it/s][A
Epoch 1:  97%|█████████▋| 6566/6778 [1:11:54<02:19,  1.52it/s][A
Epoch 1: 


Epoch: 0, Loss0.30329609154377213



Epoch 1:  97%|█████████▋| 6602/6778 [1:12:18<01:55,  1.53it/s][A
Epoch 1:  97%|█████████▋| 6603/6778 [1:12:19<01:54,  1.53it/s][A
Epoch 1:  97%|█████████▋| 6604/6778 [1:12:19<01:53,  1.53it/s][A
Epoch 1:  97%|█████████▋| 6605/6778 [1:12:20<01:53,  1.53it/s][A
Epoch 1:  97%|█████████▋| 6606/6778 [1:12:21<01:52,  1.53it/s][A
Epoch 1:  97%|█████████▋| 6607/6778 [1:12:21<01:52,  1.52it/s][A
Epoch 1:  97%|█████████▋| 6608/6778 [1:12:22<01:51,  1.52it/s][A
Epoch 1:  98%|█████████▊| 6609/6778 [1:12:23<01:50,  1.52it/s][A
Epoch 1:  98%|█████████▊| 6610/6778 [1:12:23<01:50,  1.52it/s][A
Epoch 1:  98%|█████████▊| 6611/6778 [1:12:24<01:50,  1.52it/s][A
Epoch 1:  98%|█████████▊| 6612/6778 [1:12:25<01:49,  1.52it/s][A
Epoch 1:  98%|█████████▊| 6613/6778 [1:12:25<01:48,  1.52it/s][A
Epoch 1:  98%|█████████▊| 6614/6778 [1:12:26<01:48,  1.51it/s][A
Epoch 1:  98%|█████████▊| 6615/6778 [1:12:27<01:47,  1.51it/s][A
Epoch 1:  98%|█████████▊| 6616/6778 [1:12:27<01:46,  1.53it/s][A
Epoch 1: 


Epoch: 0, Loss0.30334971447135967



Epoch 1:  98%|█████████▊| 6652/6778 [1:12:51<01:23,  1.51it/s][A
Epoch 1:  98%|█████████▊| 6653/6778 [1:12:52<01:22,  1.52it/s][A
Epoch 1:  98%|█████████▊| 6654/6778 [1:12:52<01:21,  1.52it/s][A
Epoch 1:  98%|█████████▊| 6655/6778 [1:12:53<01:21,  1.51it/s][A
Epoch 1:  98%|█████████▊| 6656/6778 [1:12:54<01:20,  1.51it/s][A
Epoch 1:  98%|█████████▊| 6657/6778 [1:12:54<01:19,  1.53it/s][A
Epoch 1:  98%|█████████▊| 6658/6778 [1:12:55<01:18,  1.53it/s][A
Epoch 1:  98%|█████████▊| 6659/6778 [1:12:55<01:17,  1.53it/s][A
Epoch 1:  98%|█████████▊| 6660/6778 [1:12:56<01:17,  1.53it/s][A
Epoch 1:  98%|█████████▊| 6661/6778 [1:12:57<01:16,  1.53it/s][A
Epoch 1:  98%|█████████▊| 6662/6778 [1:12:57<01:15,  1.53it/s][A
Epoch 1:  98%|█████████▊| 6663/6778 [1:12:58<01:15,  1.53it/s][A
Epoch 1:  98%|█████████▊| 6664/6778 [1:12:59<01:14,  1.53it/s][A
Epoch 1:  98%|█████████▊| 6665/6778 [1:12:59<01:13,  1.53it/s][A
Epoch 1:  98%|█████████▊| 6666/6778 [1:13:00<01:13,  1.53it/s][A
Epoch 1: 


Epoch: 0, Loss0.30327857917719786



Epoch 1:  99%|█████████▉| 6702/6778 [1:13:24<00:49,  1.53it/s][A
Epoch 1:  99%|█████████▉| 6703/6778 [1:13:24<00:48,  1.53it/s][A
Epoch 1:  99%|█████████▉| 6704/6778 [1:13:25<00:48,  1.53it/s][A
Epoch 1:  99%|█████████▉| 6705/6778 [1:13:26<00:47,  1.53it/s][A
Epoch 1:  99%|█████████▉| 6706/6778 [1:13:26<00:47,  1.53it/s][A
Epoch 1:  99%|█████████▉| 6707/6778 [1:13:27<00:46,  1.53it/s][A
Epoch 1:  99%|█████████▉| 6708/6778 [1:13:28<00:45,  1.53it/s][A
Epoch 1:  99%|█████████▉| 6709/6778 [1:13:28<00:45,  1.53it/s][A
Epoch 1:  99%|█████████▉| 6710/6778 [1:13:29<00:44,  1.53it/s][A
Epoch 1:  99%|█████████▉| 6711/6778 [1:13:30<00:43,  1.53it/s][A
Epoch 1:  99%|█████████▉| 6712/6778 [1:13:30<00:43,  1.53it/s][A
Epoch 1:  99%|█████████▉| 6713/6778 [1:13:31<00:42,  1.52it/s][A
Epoch 1:  99%|█████████▉| 6714/6778 [1:13:32<00:42,  1.52it/s][A
Epoch 1:  99%|█████████▉| 6715/6778 [1:13:32<00:41,  1.52it/s][A
Epoch 1:  99%|█████████▉| 6716/6778 [1:13:33<00:40,  1.52it/s][A
Epoch 1: 


Epoch: 0, Loss0.303134908698529



Epoch 1: 100%|█████████▉| 6752/6778 [1:13:57<00:17,  1.52it/s][A
Epoch 1: 100%|█████████▉| 6753/6778 [1:13:57<00:16,  1.52it/s][A
Epoch 1: 100%|█████████▉| 6754/6778 [1:13:58<00:15,  1.51it/s][A
Epoch 1: 100%|█████████▉| 6755/6778 [1:13:59<00:15,  1.52it/s][A
Epoch 1: 100%|█████████▉| 6756/6778 [1:13:59<00:14,  1.52it/s][A
Epoch 1: 100%|█████████▉| 6757/6778 [1:14:00<00:13,  1.52it/s][A
Epoch 1: 100%|█████████▉| 6758/6778 [1:14:01<00:13,  1.50it/s][A
Epoch 1: 100%|█████████▉| 6759/6778 [1:14:01<00:12,  1.51it/s][A
Epoch 1: 100%|█████████▉| 6760/6778 [1:14:02<00:11,  1.52it/s][A
Epoch 1: 100%|█████████▉| 6761/6778 [1:14:02<00:11,  1.52it/s][A
Epoch 1: 100%|█████████▉| 6762/6778 [1:14:03<00:10,  1.52it/s][A
Epoch 1: 100%|█████████▉| 6763/6778 [1:14:04<00:09,  1.52it/s][A
Epoch 1: 100%|█████████▉| 6764/6778 [1:14:04<00:09,  1.52it/s][A
Epoch 1: 100%|█████████▉| 6765/6778 [1:14:05<00:08,  1.52it/s][A
Epoch 1: 100%|█████████▉| 6766/6778 [1:14:06<00:07,  1.52it/s][A
Epoch 1: 

#### Validation Loop

In [None]:
from sklearn import metrics

for epoch in tqdm(range(EPOCHS)):

  multilabel_model.eval()
  val_targets=[]
  val_outputs=[]

  with torch.no_grad():

    for i,batch in enumerate(validation_loader):

      input_ids = batch['input_ids'].to(device)
      attention_mask = batch['attention_mask'].to(device)
      token_type_ids = batch['token_type_ids'].to(device)
      targets = batch['targets'].to(device)

      outputs = multilabel_model(input_ids,attention_mask,token_type_ids)

      val_targets.extend(targets.cpu().detach().numpy().tolist())
      val_outputs.extend(torch.sigmoid(outputs).cpu().detach().numpy().tolist())

  outputs = np.array(val_outputs) >= 0.5
  accuracy = metrics.accuracy_score(val_targets, outputs)
  f1_score_micro = metrics.f1_score(val_targets, outputs, average='micro')
  f1_score_macro = metrics.f1_score(val_targets, outputs, average='macro')
  print(f"Accuracy Score = {accuracy}")
  print(f"F1 Score (Micro) = {f1_score_micro}")
  print(f"F1 Score (Macro) = {f1_score_macro}")

In [29]:
multilabel_model

MultilabelHateBert(
  (bertmodel): BertModel(
    (embeddings): BertEmbeddings(
      (word_embeddings): Embedding(30522, 768, padding_idx=0)
      (position_embeddings): Embedding(512, 768)
      (token_type_embeddings): Embedding(2, 768)
      (LayerNorm): LayerNorm((768,), eps=1e-12, elementwise_affine=True)
      (dropout): Dropout(p=0.1, inplace=False)
    )
    (encoder): BertEncoder(
      (layer): ModuleList(
        (0-11): 12 x BertLayer(
          (attention): BertAttention(
            (self): BertSelfAttention(
              (query): Linear(in_features=768, out_features=768, bias=True)
              (key): Linear(in_features=768, out_features=768, bias=True)
              (value): Linear(in_features=768, out_features=768, bias=True)
              (dropout): Dropout(p=0.1, inplace=False)
            )
            (output): BertSelfOutput(
              (dense): Linear(in_features=768, out_features=768, bias=True)
              (LayerNorm): LayerNorm((768,), eps=1e-12, eleme

In [35]:
PATH = 'fine_tuning_v1.pth'
torch.save(multilabel_model.state_dict(), PATH)

In [37]:
print("lluak")

lluak


In [None]:

#multilabel_model1 = MultilabelHateBert(model)
#multilabel_model1.load_state_dict(torch.load('/content/fine_tuning_v1.1'))

## Interpretability

In [None]:
multilabel_dataset

In [None]:
#Import
! pip install lime
! pip install transformers-interpret

In [None]:
samples = [17, 4, 44, 3, 8, 27, 71, 74]
attributions = dict()
attributions['LIME'] = []

In [None]:
import lime
from lime.lime_text import LimeTextExplainer
explainer = LimeTextExplainer(class_names=columns_to_transform, split_expression='\s+', bow=False)

In [None]:

def predictor(texts):

    encodings = tokenizer(texts,
                           padding='max_length',
                           truncation=True,
                           max_length=MAX_LEN,
                           return_tensors='pt')

    input_ids = encodings['input_ids'].to(device)
    attention_mask = encodings['attention_mask'].to(device)
    token_type_ids = encodings['token_type_ids'].to(device)

    logits = multilabel_model(input_ids, attention_mask, token_type_ids)
    probabilities = F.softmax(logits, dim=1)

    return probabilities.cpu().detach().numpy()

for idx in samples:
    instance = val_texts.iloc[idx].text

    # Call predictor with the current instance
    exp = explainer.explain_instance(instance, predictor, num_features=200, num_samples=64)

    explanation_dict = dict(list(exp.as_map().values())[0])
    tokens = val_texts.iloc[idx].text.split(' ')
    scores = []

    for i in range(len(tokens)):
        scores.append((tokens[i], explanation_dict[i]))

    attributions['LIME'].append(scores)

In [None]:
%matplotlib inline
import matplotlib.pyplot as plt
from matplotlib import cm, transforms

# Plotting Code from innvestigate library: https://github.com/albermax/innvestigate
def plot_text_heatmap(words, scores, title="", width=10, height=0.2, verbose=0, max_word_per_line=20):
    fig = plt.figure(figsize=(width, height))

    ax = plt.gca()

    ax.set_title(title, loc='left')
    tokens = words
    if verbose > 0:
        print('len words : %d | len scores : %d' % (len(words), len(scores)))

    cmap = plt.cm.ScalarMappable(cmap=cm.bwr)
    cmap.set_clim(0, 1)

    canvas = ax.figure.canvas
    t = ax.transData

    # normalize scores to the followings:
    # - negative scores in [0, 0.5]
    # - positive scores in (0.5, 1]
    normalized_scores = 0.5 * scores / np.max(np.abs(scores)) + 0.5

    if verbose > 1:
        print('Raw score')
        print(scores)
        print('Normalized score')
        print(normalized_scores)

    # make sure the heatmap doesn't overlap with the title
    loc_y = -0.2

    for i, token in enumerate(tokens):
        *rgb, _ = cmap.to_rgba(normalized_scores[i], bytes=True)
        color = '#%02x%02x%02x' % tuple(rgb)

        text = ax.text(0.0, loc_y, token,
                       bbox={
                           'facecolor': color,
                           'pad': 5.0,
                           'linewidth': 1,
                           'boxstyle': 'round,pad=0.5'
                       }, transform=t)

        text.draw(canvas.get_renderer())
        ex = text.get_window_extent()

        # create a new line if the line exceeds the length
        if (i+1) % max_word_per_line == 0:
            loc_y = loc_y -  2.5
            t = ax.transData
        else:
            t = transforms.offset_copy(text._transform, x=ex.width+15, units='dots')

    if verbose == 0:
        ax.axis('off')

In [None]:
# Plotting
methods = ['LIME']

for sample_id in range(len(samples)):
    for method in methods:
        analysis = attributions[method][sample_id]
        words = [t[0] for t in analysis]
        scores = np.array([t[1] for t in analysis])
        plot_text_heatmap(words, scores, title='Method: %s' % method, verbose=0)
    plt.show()