<a href="https://colab.research.google.com/github/LikeWind99/DeepLearning/blob/master/%E4%BA%8C%E5%88%86%E7%B1%BB.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [6]:
import torch as t
import torchvision
from torchvision.datasets import ImageFolder
import torch.nn as nn
from torch.utils.data import DataLoader
import torchvision.transforms as T
import matplotlib.pyplot as plt
import torch.nn.functional as F
import tqdm
import numpy as np

In [7]:
normalize = T.Normalize(mean=[0.4, 0.4, 0.4], std=[0.2, 0.2, 0.2])
transform = T.Compose([
    T.RandomResizedCrop(224),
    T.RandomHorizontalFlip(),
    T.ToTensor(),
    normalize
])
device = t.device('cuda' if t.cuda.is_available() else 'cpu')
batch_size = 4
num_works = 2
epochs = 100


In [10]:
dataset = ImageFolder(r'/content/drive/MyDrive/test', transform=transform)
sample_size = len(dataset)
trainDataset, testDataset = t.utils.data.random_split(dataset= dataset, lengths=[int(0.8 * sample_size), int(0.2 * sample_size)])

trainLoader = DataLoader(dataset=trainDataset, batch_size=batch_size, shuffle=True, drop_last=True)
testLoader = DataLoader(dataset=testDataset, batch_size=batch_size, drop_last=True)

In [11]:
class ResidualBlock(nn.Module):
    def __init__(self, inchannel, outchannel, stride=1, shortcut=None):
        super(ResidualBlock,self).__init__()
        self.left = nn.Sequential(
            nn.Conv2d(inchannel,outchannel,3,stride, 1,bias=False),
            nn.BatchNorm2d(outchannel),
            nn.ReLU(inplace=True),
            nn.Conv2d(outchannel,outchannel,3,1,1,bias=False),
            nn.BatchNorm2d(outchannel)
        )
        self.right = shortcut
    
    def forward(self,x):
        out = self.left(x)
        residual = x if self.right is None else self.right(x)
        out += residual
        return F.relu(out)
    
class ResNet(nn.Module):
    def __init__(self, num_classes=2):
        super(ResNet,self).__init__()
        self.pre = nn.Sequential(
                nn.Conv2d(3, 64, 7, 2, 3, bias=False),
                nn.BatchNorm2d(64),
                nn.ReLU(inplace=True),
                nn.MaxPool2d(3, 2, 1)
        )
        self.layer1 = self._make_layer( 64, 64, 3)
        self.layer2 = self._make_layer( 64, 128, 4, stride=2)
        self.layer3 = self._make_layer( 128, 256, 6, stride=2)
        self.layer4 = self._make_layer( 256, 512, 3, stride=2)
        self.fc = nn.Linear(512, num_classes)
        
    def _make_layer(self,  inchannel, outchannel, block_num, stride=1):
        shortcut = nn.Sequential(
                nn.Conv2d(inchannel,outchannel,1,stride, bias=False),
                nn.BatchNorm2d(outchannel)
        )
        layers = []
        layers.append(ResidualBlock(inchannel, outchannel, stride, shortcut))
        
        for i in range(1, block_num):
            layers.append(ResidualBlock(outchannel, outchannel))
        return nn.Sequential(*layers)
    
    def forward(self, x):
        x = self.pre(x)
        
        x = self.layer1(x)
        x = self.layer2(x)
        x = self.layer3(x)
        x = self.layer4(x)

        x = F.avg_pool2d(x, 7)
        x = x.view(x.size(0), -1)
        return self.fc(x)

In [14]:
net = ResNet()
total_step = len(trainLoader)
criterion = nn.CrossEntropyLoss()
optimizer = t.optim.Adam(params=net.parameters())
for epoch in range(epochs):
  for i, (imgs, labels) in tqdm.tqdm(enumerate(trainLoader)):
    net = net.to(device)
    optimizer.zero_grad()
    imgs = imgs.to(device)
    labels = labels.to(device)
    predict = net(imgs)
    loss = criterion(predict, labels)
    loss.backward()
    optimizer.step()
    if (i + 1) % 100 == 0:
      print(f'Epoch [{epoch}/{epochs}], Step [{i+1}/{total_step}], loss: {loss.item():.4f}')





0it [00:00, ?it/s][A[A[A


1it [00:02,  2.26s/it][A[A[A


2it [00:04,  2.29s/it][A[A[A


3it [00:07,  2.35s/it][A[A[A


4it [00:08,  2.15s/it][A[A[A


5it [00:10,  2.00s/it][A[A[A


6it [00:12,  2.06s/it][A[A[A


7it [00:15,  2.42s/it][A[A[A


8it [00:17,  2.17s/it][A[A[A


9it [00:20,  2.43s/it][A[A[A


10it [00:22,  2.18s/it][A[A[A


11it [00:25,  2.44s/it][A[A[A


12it [00:28,  2.65s/it][A[A[A


13it [00:31,  2.74s/it][A[A[A


14it [00:33,  2.59s/it][A[A[A


15it [00:36,  2.72s/it][A[A[A


16it [00:39,  2.80s/it][A[A[A


17it [00:42,  2.94s/it][A[A[A


18it [00:45,  2.97s/it][A[A[A


19it [00:48,  2.99s/it][A[A[A


20it [00:51,  2.76s/it][A[A[A


21it [00:54,  2.85s/it][A[A[A


22it [00:56,  2.68s/it][A[A[A


23it [00:58,  2.59s/it][A[A[A


24it [01:01,  2.75s/it][A[A[A


25it [01:04,  2.80s/it][A[A[A


26it [01:06,  2.43s/it][A[A[A


27it [01:08,  2.36s/it][A[A[A


28it [01:11,  2.55s/it][A[A[

Epoch [0/100], Step [100/187], loss: 0.0229





101it [04:11,  2.10s/it][A[A[A


102it [04:13,  1.95s/it][A[A[A


103it [04:16,  2.27s/it][A[A[A


104it [04:18,  2.27s/it][A[A[A


105it [04:20,  2.04s/it][A[A[A


106it [04:22,  2.09s/it][A[A[A


107it [04:24,  2.15s/it][A[A[A


109it [04:27,  1.96s/it][A[A[A


110it [04:30,  2.31s/it][A[A[A


111it [04:32,  2.13s/it][A[A[A


112it [04:34,  2.14s/it][A[A[A


113it [04:37,  2.23s/it][A[A[A


114it [04:40,  2.46s/it][A[A[A


115it [04:41,  2.16s/it][A[A[A


116it [04:44,  2.22s/it][A[A[A


117it [04:46,  2.40s/it][A[A[A


118it [04:48,  2.29s/it][A[A[A


119it [04:51,  2.32s/it][A[A[A


120it [04:54,  2.58s/it][A[A[A


121it [04:57,  2.74s/it][A[A[A


122it [04:58,  2.18s/it][A[A[A


123it [05:00,  2.20s/it][A[A[A


124it [05:02,  2.15s/it][A[A[A


125it [05:05,  2.41s/it][A[A[A


126it [05:08,  2.37s/it][A[A[A


127it [05:11,  2.64s/it][A[A[A


128it [05:12,  2.34s/it][A[A[A


129it [05:16,  2.59s/it]

Epoch [1/100], Step [100/187], loss: 0.0851





107it [00:04, 22.47it/s][A[A[A


110it [00:04, 22.78it/s][A[A[A


113it [00:04, 22.96it/s][A[A[A


116it [00:05, 22.31it/s][A[A[A


119it [00:05, 22.63it/s][A[A[A


122it [00:05, 22.69it/s][A[A[A


125it [00:05, 22.84it/s][A[A[A


128it [00:05, 23.24it/s][A[A[A


131it [00:05, 23.36it/s][A[A[A


134it [00:05, 23.34it/s][A[A[A


137it [00:06, 23.38it/s][A[A[A


140it [00:06, 22.79it/s][A[A[A


143it [00:06, 23.07it/s][A[A[A


146it [00:06, 23.37it/s][A[A[A


149it [00:06, 23.02it/s][A[A[A


152it [00:06, 23.27it/s][A[A[A


155it [00:06, 23.37it/s][A[A[A


158it [00:06, 22.89it/s][A[A[A


161it [00:07, 23.08it/s][A[A[A


164it [00:07, 23.26it/s][A[A[A


167it [00:07, 23.14it/s][A[A[A


170it [00:07, 23.23it/s][A[A[A


173it [00:07, 23.04it/s][A[A[A


176it [00:07, 23.18it/s][A[A[A


179it [00:07, 22.83it/s][A[A[A


182it [00:07, 23.13it/s][A[A[A


187it [00:08, 22.86it/s]



0it [00:00, ?it/s][A[A[A


3it

Epoch [2/100], Step [100/187], loss: 0.1551





105it [00:04, 22.50it/s][A[A[A


108it [00:04, 22.55it/s][A[A[A


111it [00:04, 22.83it/s][A[A[A


114it [00:04, 22.77it/s][A[A[A


117it [00:05, 22.94it/s][A[A[A


120it [00:05, 23.06it/s][A[A[A


123it [00:05, 22.99it/s][A[A[A


126it [00:05, 22.93it/s][A[A[A


129it [00:05, 23.24it/s][A[A[A


132it [00:05, 23.24it/s][A[A[A


135it [00:05, 23.49it/s][A[A[A


138it [00:05, 23.69it/s][A[A[A


141it [00:06, 23.54it/s][A[A[A


144it [00:06, 23.61it/s][A[A[A


147it [00:06, 23.62it/s][A[A[A


150it [00:06, 23.15it/s][A[A[A


153it [00:06, 23.36it/s][A[A[A


156it [00:06, 23.40it/s][A[A[A


159it [00:06, 23.02it/s][A[A[A


162it [00:07, 23.22it/s][A[A[A


165it [00:07, 23.06it/s][A[A[A


168it [00:07, 23.21it/s][A[A[A


171it [00:07, 23.37it/s][A[A[A


174it [00:07, 22.86it/s][A[A[A


177it [00:07, 23.10it/s][A[A[A


180it [00:07, 23.30it/s][A[A[A


183it [00:07, 23.09it/s][A[A[A


187it [00:08, 23.11it/s]


Epoch [3/100], Step [100/187], loss: 0.2035





105it [00:04, 22.46it/s][A[A[A


108it [00:04, 22.01it/s][A[A[A


111it [00:04, 22.48it/s][A[A[A


114it [00:04, 22.87it/s][A[A[A


117it [00:05, 22.91it/s][A[A[A


120it [00:05, 23.03it/s][A[A[A


123it [00:05, 22.91it/s][A[A[A


126it [00:05, 22.91it/s][A[A[A


129it [00:05, 22.88it/s][A[A[A


132it [00:05, 23.15it/s][A[A[A


135it [00:05, 23.46it/s][A[A[A


138it [00:06, 23.45it/s][A[A[A


141it [00:06, 23.60it/s][A[A[A


144it [00:06, 23.56it/s][A[A[A


147it [00:06, 23.32it/s][A[A[A


150it [00:06, 23.19it/s][A[A[A


153it [00:06, 23.19it/s][A[A[A


156it [00:06, 23.36it/s][A[A[A


159it [00:06, 23.10it/s][A[A[A


162it [00:07, 22.65it/s][A[A[A


165it [00:07, 22.11it/s][A[A[A


168it [00:07, 22.50it/s][A[A[A


171it [00:07, 22.66it/s][A[A[A


174it [00:07, 22.84it/s][A[A[A


177it [00:07, 23.03it/s][A[A[A


180it [00:07, 23.10it/s][A[A[A


183it [00:07, 23.14it/s][A[A[A


187it [00:08, 22.92it/s]


Epoch [4/100], Step [100/187], loss: 0.2477





105it [00:04, 22.49it/s][A[A[A


108it [00:04, 22.74it/s][A[A[A


111it [00:04, 22.85it/s][A[A[A


114it [00:04, 23.10it/s][A[A[A


117it [00:05, 23.17it/s][A[A[A


120it [00:05, 23.39it/s][A[A[A


123it [00:05, 23.47it/s][A[A[A


126it [00:05, 22.89it/s][A[A[A


129it [00:05, 23.15it/s][A[A[A


132it [00:05, 22.93it/s][A[A[A


135it [00:05, 23.06it/s][A[A[A


138it [00:05, 23.17it/s][A[A[A


141it [00:06, 23.06it/s][A[A[A


144it [00:06, 23.36it/s][A[A[A


147it [00:06, 22.57it/s][A[A[A


150it [00:06, 22.52it/s][A[A[A


153it [00:06, 22.88it/s][A[A[A


156it [00:06, 23.31it/s][A[A[A


159it [00:06, 23.56it/s][A[A[A


162it [00:07, 23.68it/s][A[A[A


165it [00:07, 23.75it/s][A[A[A


168it [00:07, 23.72it/s][A[A[A


171it [00:07, 23.58it/s][A[A[A


174it [00:07, 23.58it/s][A[A[A


177it [00:07, 23.53it/s][A[A[A


180it [00:07, 23.70it/s][A[A[A


183it [00:07, 23.56it/s][A[A[A


187it [00:08, 23.13it/s]


Epoch [5/100], Step [100/187], loss: 0.9034





105it [00:04, 22.79it/s][A[A[A


108it [00:04, 22.99it/s][A[A[A


111it [00:04, 23.06it/s][A[A[A


114it [00:04, 23.29it/s][A[A[A


117it [00:05, 23.45it/s][A[A[A


120it [00:05, 23.42it/s][A[A[A


123it [00:05, 23.47it/s][A[A[A


126it [00:05, 22.32it/s][A[A[A


129it [00:05, 22.47it/s][A[A[A


132it [00:05, 22.82it/s][A[A[A


135it [00:05, 23.08it/s][A[A[A


138it [00:05, 22.84it/s][A[A[A


141it [00:06, 23.11it/s][A[A[A


144it [00:06, 23.04it/s][A[A[A


147it [00:06, 22.55it/s][A[A[A


150it [00:06, 22.88it/s][A[A[A


153it [00:06, 22.53it/s][A[A[A


156it [00:06, 22.58it/s][A[A[A


159it [00:06, 22.98it/s][A[A[A


162it [00:07, 23.05it/s][A[A[A


165it [00:07, 23.31it/s][A[A[A


168it [00:07, 23.37it/s][A[A[A


171it [00:07, 23.03it/s][A[A[A


174it [00:07, 23.21it/s][A[A[A


177it [00:07, 23.31it/s][A[A[A


180it [00:07, 23.25it/s][A[A[A


183it [00:07, 23.33it/s][A[A[A


187it [00:08, 23.01it/s]


Epoch [6/100], Step [100/187], loss: 0.0456





105it [00:04, 21.80it/s][A[A[A


108it [00:04, 22.35it/s][A[A[A


111it [00:04, 22.70it/s][A[A[A


114it [00:05, 22.77it/s][A[A[A


117it [00:05, 23.00it/s][A[A[A


120it [00:05, 22.74it/s][A[A[A


123it [00:05, 22.87it/s][A[A[A


126it [00:05, 22.92it/s][A[A[A


129it [00:05, 22.84it/s][A[A[A


132it [00:05, 23.11it/s][A[A[A


135it [00:05, 23.24it/s][A[A[A


138it [00:06, 22.89it/s][A[A[A


141it [00:06, 22.82it/s][A[A[A


144it [00:06, 22.70it/s][A[A[A


147it [00:06, 22.70it/s][A[A[A


150it [00:06, 22.95it/s][A[A[A


153it [00:06, 23.13it/s][A[A[A


156it [00:06, 23.16it/s][A[A[A


159it [00:07, 23.36it/s][A[A[A


162it [00:07, 23.29it/s][A[A[A


165it [00:07, 23.06it/s][A[A[A


168it [00:07, 22.89it/s][A[A[A


171it [00:07, 22.89it/s][A[A[A


174it [00:07, 22.95it/s][A[A[A


177it [00:07, 23.03it/s][A[A[A


180it [00:07, 22.89it/s][A[A[A


183it [00:08, 22.85it/s][A[A[A


187it [00:08, 22.70it/s]


Epoch [7/100], Step [100/187], loss: 0.8320





105it [00:04, 21.76it/s][A[A[A


108it [00:04, 21.95it/s][A[A[A


111it [00:04, 22.09it/s][A[A[A


114it [00:05, 22.33it/s][A[A[A


117it [00:05, 22.17it/s][A[A[A


120it [00:05, 22.35it/s][A[A[A


123it [00:05, 22.27it/s][A[A[A


126it [00:05, 22.35it/s][A[A[A


129it [00:05, 22.61it/s][A[A[A


132it [00:05, 22.80it/s][A[A[A


135it [00:06, 22.84it/s][A[A[A


138it [00:06, 21.98it/s][A[A[A


141it [00:06, 21.99it/s][A[A[A


144it [00:06, 22.11it/s][A[A[A


147it [00:06, 22.39it/s][A[A[A


150it [00:06, 22.59it/s][A[A[A


153it [00:06, 22.30it/s][A[A[A


156it [00:06, 22.42it/s][A[A[A


159it [00:07, 22.42it/s][A[A[A


162it [00:07, 22.27it/s][A[A[A


165it [00:07, 22.54it/s][A[A[A


168it [00:07, 22.32it/s][A[A[A


171it [00:07, 22.24it/s][A[A[A


174it [00:07, 22.45it/s][A[A[A


177it [00:07, 22.66it/s][A[A[A


180it [00:08, 22.66it/s][A[A[A


183it [00:08, 22.62it/s][A[A[A


187it [00:08, 22.33it/s]


Epoch [8/100], Step [100/187], loss: 0.1052





105it [00:04, 22.30it/s][A[A[A


108it [00:04, 22.17it/s][A[A[A


111it [00:04, 22.33it/s][A[A[A


114it [00:05, 22.27it/s][A[A[A


117it [00:05, 22.57it/s][A[A[A


120it [00:05, 22.63it/s][A[A[A


123it [00:05, 22.90it/s][A[A[A


126it [00:05, 23.18it/s][A[A[A


129it [00:05, 23.29it/s][A[A[A


132it [00:05, 23.35it/s][A[A[A


135it [00:06, 22.75it/s][A[A[A


138it [00:06, 22.79it/s][A[A[A


141it [00:06, 23.12it/s][A[A[A


144it [00:06, 23.02it/s][A[A[A


147it [00:06, 22.75it/s][A[A[A


150it [00:06, 22.99it/s][A[A[A


153it [00:06, 23.20it/s][A[A[A


156it [00:06, 23.32it/s][A[A[A


159it [00:07, 23.26it/s][A[A[A


162it [00:07, 23.24it/s][A[A[A


165it [00:07, 23.30it/s][A[A[A


168it [00:07, 23.20it/s][A[A[A


171it [00:07, 23.32it/s][A[A[A


174it [00:07, 23.15it/s][A[A[A


177it [00:07, 23.12it/s][A[A[A


180it [00:07, 22.98it/s][A[A[A


183it [00:08, 22.70it/s][A[A[A


187it [00:08, 22.67it/s]


Epoch [9/100], Step [100/187], loss: 0.0523





105it [00:04, 22.01it/s][A[A[A


108it [00:04, 22.11it/s][A[A[A


111it [00:04, 22.62it/s][A[A[A


114it [00:05, 22.59it/s][A[A[A


117it [00:05, 22.58it/s][A[A[A


120it [00:05, 22.69it/s][A[A[A


123it [00:05, 22.83it/s][A[A[A


126it [00:05, 23.04it/s][A[A[A


129it [00:05, 22.97it/s][A[A[A


132it [00:05, 22.47it/s][A[A[A


135it [00:05, 22.88it/s][A[A[A


138it [00:06, 22.84it/s][A[A[A


141it [00:06, 23.07it/s][A[A[A


144it [00:06, 23.21it/s][A[A[A


147it [00:06, 23.39it/s][A[A[A


150it [00:06, 23.45it/s][A[A[A


153it [00:06, 23.56it/s][A[A[A


156it [00:06, 23.08it/s][A[A[A


159it [00:07, 22.83it/s][A[A[A


162it [00:07, 23.05it/s][A[A[A


165it [00:07, 22.83it/s][A[A[A


168it [00:07, 23.11it/s][A[A[A


171it [00:07, 23.29it/s][A[A[A


174it [00:07, 22.74it/s][A[A[A


177it [00:07, 22.73it/s][A[A[A


180it [00:07, 23.06it/s][A[A[A


183it [00:08, 22.76it/s][A[A[A


187it [00:08, 22.70it/s]


Epoch [10/100], Step [100/187], loss: 0.0443





105it [00:04, 22.91it/s][A[A[A


108it [00:04, 22.73it/s][A[A[A


111it [00:04, 23.02it/s][A[A[A


114it [00:04, 22.69it/s][A[A[A


117it [00:05, 22.97it/s][A[A[A


120it [00:05, 23.18it/s][A[A[A


123it [00:05, 22.83it/s][A[A[A


126it [00:05, 23.08it/s][A[A[A


129it [00:05, 23.29it/s][A[A[A


132it [00:05, 23.15it/s][A[A[A


135it [00:05, 23.36it/s][A[A[A


138it [00:05, 23.52it/s][A[A[A


141it [00:06, 23.42it/s][A[A[A


144it [00:06, 23.48it/s][A[A[A


147it [00:06, 23.33it/s][A[A[A


150it [00:06, 23.37it/s][A[A[A


153it [00:06, 23.46it/s][A[A[A


156it [00:06, 23.28it/s][A[A[A


159it [00:06, 23.35it/s][A[A[A


162it [00:06, 23.53it/s][A[A[A


165it [00:07, 23.44it/s][A[A[A


168it [00:07, 23.57it/s][A[A[A


171it [00:07, 23.60it/s][A[A[A


174it [00:07, 23.16it/s][A[A[A


177it [00:07, 23.36it/s][A[A[A


180it [00:07, 23.26it/s][A[A[A


183it [00:07, 23.26it/s][A[A[A


187it [00:08, 23.29it/s]


Epoch [11/100], Step [100/187], loss: 0.1189





105it [00:04, 22.75it/s][A[A[A


108it [00:04, 22.05it/s][A[A[A


111it [00:04, 22.45it/s][A[A[A


114it [00:04, 22.73it/s][A[A[A


117it [00:05, 23.01it/s][A[A[A


120it [00:05, 23.18it/s][A[A[A


123it [00:05, 23.11it/s][A[A[A


126it [00:05, 23.29it/s][A[A[A


129it [00:05, 23.43it/s][A[A[A


132it [00:05, 23.16it/s][A[A[A


135it [00:05, 23.03it/s][A[A[A


138it [00:05, 23.38it/s][A[A[A


141it [00:06, 23.53it/s][A[A[A


144it [00:06, 23.37it/s][A[A[A


147it [00:06, 23.48it/s][A[A[A


150it [00:06, 23.33it/s][A[A[A


153it [00:06, 23.36it/s][A[A[A


156it [00:06, 23.17it/s][A[A[A


159it [00:06, 22.55it/s][A[A[A


162it [00:07, 22.67it/s][A[A[A


165it [00:07, 23.01it/s][A[A[A


168it [00:07, 23.01it/s][A[A[A


171it [00:07, 23.14it/s][A[A[A


174it [00:07, 23.31it/s][A[A[A


177it [00:07, 23.25it/s][A[A[A


180it [00:07, 23.24it/s][A[A[A


183it [00:07, 23.42it/s][A[A[A


187it [00:08, 23.11it/s]


Epoch [12/100], Step [100/187], loss: 0.1238





105it [00:04, 22.66it/s][A[A[A


108it [00:04, 22.60it/s][A[A[A


111it [00:04, 22.86it/s][A[A[A


114it [00:04, 22.59it/s][A[A[A


117it [00:05, 22.81it/s][A[A[A


120it [00:05, 22.88it/s][A[A[A


123it [00:05, 22.62it/s][A[A[A


126it [00:05, 22.82it/s][A[A[A


129it [00:05, 22.97it/s][A[A[A


132it [00:05, 22.75it/s][A[A[A


135it [00:05, 23.02it/s][A[A[A


138it [00:06, 23.08it/s][A[A[A


141it [00:06, 23.23it/s][A[A[A


144it [00:06, 23.35it/s][A[A[A


147it [00:06, 23.38it/s][A[A[A


150it [00:06, 22.78it/s][A[A[A


153it [00:06, 22.87it/s][A[A[A


156it [00:06, 22.74it/s][A[A[A


159it [00:06, 22.90it/s][A[A[A


162it [00:07, 23.01it/s][A[A[A


165it [00:07, 23.16it/s][A[A[A


168it [00:07, 23.14it/s][A[A[A


171it [00:07, 23.19it/s][A[A[A


174it [00:07, 23.28it/s][A[A[A


177it [00:07, 22.70it/s][A[A[A


180it [00:07, 22.88it/s][A[A[A


183it [00:07, 23.16it/s][A[A[A


187it [00:08, 23.02it/s]


Epoch [13/100], Step [100/187], loss: 0.0229





105it [00:04, 22.73it/s][A[A[A


108it [00:04, 22.64it/s][A[A[A


111it [00:04, 23.06it/s][A[A[A


114it [00:04, 23.35it/s][A[A[A


117it [00:05, 23.49it/s][A[A[A


120it [00:05, 23.75it/s][A[A[A


123it [00:05, 23.49it/s][A[A[A


126it [00:05, 23.69it/s][A[A[A


129it [00:05, 22.87it/s][A[A[A


132it [00:05, 22.49it/s][A[A[A


135it [00:05, 22.87it/s][A[A[A


138it [00:05, 23.20it/s][A[A[A


141it [00:06, 23.30it/s][A[A[A


144it [00:06, 23.40it/s][A[A[A


147it [00:06, 23.60it/s][A[A[A


150it [00:06, 23.64it/s][A[A[A


153it [00:06, 23.81it/s][A[A[A


156it [00:06, 23.43it/s][A[A[A


159it [00:06, 23.33it/s][A[A[A


162it [00:07, 23.37it/s][A[A[A


165it [00:07, 23.47it/s][A[A[A


168it [00:07, 23.32it/s][A[A[A


171it [00:07, 23.49it/s][A[A[A


174it [00:07, 23.55it/s][A[A[A


177it [00:07, 23.03it/s][A[A[A


180it [00:07, 23.14it/s][A[A[A


183it [00:07, 23.13it/s][A[A[A


187it [00:08, 23.14it/s]


Epoch [14/100], Step [100/187], loss: 0.6413





105it [00:04, 23.14it/s][A[A[A


108it [00:04, 22.81it/s][A[A[A


111it [00:04, 22.98it/s][A[A[A


114it [00:04, 23.05it/s][A[A[A


117it [00:05, 23.06it/s][A[A[A


120it [00:05, 23.19it/s][A[A[A


123it [00:05, 23.31it/s][A[A[A


126it [00:05, 23.14it/s][A[A[A


129it [00:05, 23.02it/s][A[A[A


132it [00:05, 22.98it/s][A[A[A


135it [00:05, 23.02it/s][A[A[A


138it [00:05, 23.31it/s][A[A[A


141it [00:06, 23.48it/s][A[A[A


144it [00:06, 23.57it/s][A[A[A


147it [00:06, 23.57it/s][A[A[A


150it [00:06, 23.61it/s][A[A[A


153it [00:06, 23.53it/s][A[A[A


156it [00:06, 23.48it/s][A[A[A


159it [00:06, 23.48it/s][A[A[A


162it [00:06, 23.26it/s][A[A[A


165it [00:07, 23.32it/s][A[A[A


168it [00:07, 23.47it/s][A[A[A


171it [00:07, 23.46it/s][A[A[A


174it [00:07, 23.44it/s][A[A[A


177it [00:07, 23.15it/s][A[A[A


180it [00:07, 23.04it/s][A[A[A


183it [00:07, 22.67it/s][A[A[A


187it [00:08, 23.17it/s]


Epoch [15/100], Step [100/187], loss: 0.1865





105it [00:04, 22.91it/s][A[A[A


108it [00:04, 22.70it/s][A[A[A


111it [00:04, 22.89it/s][A[A[A


114it [00:04, 23.15it/s][A[A[A


117it [00:05, 23.13it/s][A[A[A


120it [00:05, 23.19it/s][A[A[A


123it [00:05, 23.17it/s][A[A[A


126it [00:05, 22.69it/s][A[A[A


129it [00:05, 22.92it/s][A[A[A


132it [00:05, 22.95it/s][A[A[A


135it [00:05, 23.03it/s][A[A[A


138it [00:05, 23.26it/s][A[A[A


141it [00:06, 23.33it/s][A[A[A


144it [00:06, 23.06it/s][A[A[A


147it [00:06, 23.25it/s][A[A[A


150it [00:06, 23.32it/s][A[A[A


153it [00:06, 23.26it/s][A[A[A


156it [00:06, 23.15it/s][A[A[A


159it [00:06, 23.11it/s][A[A[A


162it [00:06, 23.05it/s][A[A[A


165it [00:07, 22.85it/s][A[A[A


168it [00:07, 22.93it/s][A[A[A


171it [00:07, 23.21it/s][A[A[A


174it [00:07, 23.01it/s][A[A[A


177it [00:07, 22.71it/s][A[A[A


180it [00:07, 22.81it/s][A[A[A


183it [00:07, 22.93it/s][A[A[A


187it [00:08, 23.14it/s]


Epoch [16/100], Step [100/187], loss: 0.0605





105it [00:04, 22.64it/s][A[A[A


108it [00:04, 22.75it/s][A[A[A


111it [00:04, 22.91it/s][A[A[A


114it [00:04, 22.85it/s][A[A[A


117it [00:05, 22.85it/s][A[A[A


120it [00:05, 23.09it/s][A[A[A


123it [00:05, 22.91it/s][A[A[A


126it [00:05, 23.05it/s][A[A[A


129it [00:05, 23.30it/s][A[A[A


132it [00:05, 23.19it/s][A[A[A


135it [00:05, 23.17it/s][A[A[A


138it [00:06, 22.91it/s][A[A[A


141it [00:06, 23.05it/s][A[A[A


144it [00:06, 23.25it/s][A[A[A


147it [00:06, 23.22it/s][A[A[A


150it [00:06, 22.95it/s][A[A[A


153it [00:06, 23.02it/s][A[A[A


156it [00:06, 22.72it/s][A[A[A


159it [00:06, 22.24it/s][A[A[A


162it [00:07, 22.21it/s][A[A[A


165it [00:07, 22.51it/s][A[A[A


168it [00:07, 22.49it/s][A[A[A


171it [00:07, 22.63it/s][A[A[A


174it [00:07, 22.89it/s][A[A[A


177it [00:07, 22.88it/s][A[A[A


180it [00:07, 22.72it/s][A[A[A


183it [00:07, 22.81it/s][A[A[A


187it [00:08, 22.90it/s]


Epoch [17/100], Step [100/187], loss: 0.0622





107it [00:04, 22.34it/s][A[A[A


110it [00:04, 22.57it/s][A[A[A


113it [00:04, 22.88it/s][A[A[A


116it [00:05, 23.08it/s][A[A[A


119it [00:05, 23.34it/s][A[A[A


122it [00:05, 23.46it/s][A[A[A


125it [00:05, 22.84it/s][A[A[A


128it [00:05, 23.05it/s][A[A[A


131it [00:05, 22.89it/s][A[A[A


134it [00:05, 22.98it/s][A[A[A


137it [00:05, 23.15it/s][A[A[A


140it [00:06, 23.36it/s][A[A[A


143it [00:06, 23.52it/s][A[A[A


146it [00:06, 23.55it/s][A[A[A


149it [00:06, 23.71it/s][A[A[A


152it [00:06, 23.83it/s][A[A[A


155it [00:06, 23.33it/s][A[A[A


158it [00:06, 23.53it/s][A[A[A


161it [00:06, 23.59it/s][A[A[A


164it [00:07, 23.57it/s][A[A[A


167it [00:07, 23.61it/s][A[A[A


170it [00:07, 23.64it/s][A[A[A


173it [00:07, 22.77it/s][A[A[A


176it [00:07, 22.88it/s][A[A[A


179it [00:07, 23.07it/s][A[A[A


182it [00:07, 23.28it/s][A[A[A


187it [00:08, 23.17it/s]



0it [00:00, ?it/s][A[A[A


3it

Epoch [18/100], Step [100/187], loss: 0.0501





105it [00:04, 22.53it/s][A[A[A


108it [00:04, 22.67it/s][A[A[A


111it [00:04, 22.88it/s][A[A[A


114it [00:04, 22.88it/s][A[A[A


117it [00:05, 23.20it/s][A[A[A


120it [00:05, 23.28it/s][A[A[A


123it [00:05, 23.18it/s][A[A[A


126it [00:05, 23.31it/s][A[A[A


129it [00:05, 23.41it/s][A[A[A


132it [00:05, 23.16it/s][A[A[A


135it [00:05, 23.36it/s][A[A[A


138it [00:05, 23.51it/s][A[A[A


141it [00:06, 22.97it/s][A[A[A


144it [00:06, 23.12it/s][A[A[A


147it [00:06, 23.34it/s][A[A[A


150it [00:06, 23.24it/s][A[A[A


153it [00:06, 23.29it/s][A[A[A


156it [00:06, 22.69it/s][A[A[A


159it [00:06, 22.75it/s][A[A[A


162it [00:06, 22.77it/s][A[A[A


165it [00:07, 23.01it/s][A[A[A


168it [00:07, 22.97it/s][A[A[A


171it [00:07, 22.83it/s][A[A[A


174it [00:07, 23.06it/s][A[A[A


177it [00:07, 22.94it/s][A[A[A


180it [00:07, 23.14it/s][A[A[A


183it [00:07, 23.28it/s][A[A[A


187it [00:08, 23.15it/s]


Epoch [19/100], Step [100/187], loss: 0.8409





105it [00:04, 22.78it/s][A[A[A


108it [00:04, 22.66it/s][A[A[A


111it [00:04, 22.94it/s][A[A[A


114it [00:04, 23.18it/s][A[A[A


117it [00:05, 23.00it/s][A[A[A


120it [00:05, 23.22it/s][A[A[A


123it [00:05, 22.87it/s][A[A[A


126it [00:05, 22.67it/s][A[A[A


129it [00:05, 23.01it/s][A[A[A


132it [00:05, 22.77it/s][A[A[A


135it [00:05, 23.03it/s][A[A[A


138it [00:05, 23.25it/s][A[A[A


141it [00:06, 22.98it/s][A[A[A


144it [00:06, 23.25it/s][A[A[A


147it [00:06, 23.32it/s][A[A[A


150it [00:06, 23.29it/s][A[A[A


153it [00:06, 23.17it/s][A[A[A


156it [00:06, 23.09it/s][A[A[A


159it [00:06, 23.14it/s][A[A[A


162it [00:07, 23.37it/s][A[A[A


165it [00:07, 22.74it/s][A[A[A


168it [00:07, 22.42it/s][A[A[A


171it [00:07, 22.65it/s][A[A[A


174it [00:07, 22.76it/s][A[A[A


177it [00:07, 22.62it/s][A[A[A


180it [00:07, 22.70it/s][A[A[A


183it [00:07, 22.57it/s][A[A[A


187it [00:08, 23.02it/s]


Epoch [20/100], Step [100/187], loss: 0.0591





105it [00:04, 22.51it/s][A[A[A


108it [00:04, 22.42it/s][A[A[A


111it [00:04, 22.53it/s][A[A[A


114it [00:04, 22.84it/s][A[A[A


117it [00:05, 23.18it/s][A[A[A


120it [00:05, 23.01it/s][A[A[A


123it [00:05, 22.91it/s][A[A[A


126it [00:05, 23.23it/s][A[A[A


129it [00:05, 22.90it/s][A[A[A


132it [00:05, 23.14it/s][A[A[A


135it [00:05, 23.24it/s][A[A[A


138it [00:05, 23.31it/s][A[A[A


141it [00:06, 23.26it/s][A[A[A


144it [00:06, 23.19it/s][A[A[A


147it [00:06, 23.34it/s][A[A[A


150it [00:06, 23.22it/s][A[A[A


153it [00:06, 23.04it/s][A[A[A


156it [00:06, 23.16it/s][A[A[A


159it [00:06, 22.97it/s][A[A[A


162it [00:07, 22.98it/s][A[A[A


165it [00:07, 23.15it/s][A[A[A


168it [00:07, 23.07it/s][A[A[A


171it [00:07, 23.38it/s][A[A[A


174it [00:07, 22.90it/s][A[A[A


177it [00:07, 22.42it/s][A[A[A


180it [00:07, 22.82it/s][A[A[A


183it [00:07, 23.03it/s][A[A[A


187it [00:08, 23.05it/s]


Epoch [21/100], Step [100/187], loss: 0.2789





105it [00:04, 22.49it/s][A[A[A


108it [00:04, 22.74it/s][A[A[A


111it [00:04, 22.81it/s][A[A[A


114it [00:04, 22.88it/s][A[A[A


117it [00:05, 23.06it/s][A[A[A


120it [00:05, 22.98it/s][A[A[A


123it [00:05, 22.80it/s][A[A[A


126it [00:05, 23.12it/s][A[A[A


129it [00:05, 22.93it/s][A[A[A


132it [00:05, 23.08it/s][A[A[A


135it [00:05, 23.03it/s][A[A[A


138it [00:05, 23.17it/s][A[A[A


141it [00:06, 23.20it/s][A[A[A


144it [00:06, 23.19it/s][A[A[A


147it [00:06, 23.28it/s][A[A[A


150it [00:06, 23.18it/s][A[A[A


153it [00:06, 23.03it/s][A[A[A


156it [00:06, 23.17it/s][A[A[A


159it [00:06, 23.19it/s][A[A[A


162it [00:07, 23.23it/s][A[A[A


165it [00:07, 23.45it/s][A[A[A


168it [00:07, 23.36it/s][A[A[A


171it [00:07, 23.48it/s][A[A[A


174it [00:07, 23.45it/s][A[A[A


177it [00:07, 22.61it/s][A[A[A


180it [00:07, 22.92it/s][A[A[A


183it [00:07, 23.14it/s][A[A[A


187it [00:08, 23.06it/s]


Epoch [22/100], Step [100/187], loss: 0.5507





105it [00:04, 22.79it/s][A[A[A


108it [00:04, 23.00it/s][A[A[A


111it [00:04, 23.20it/s][A[A[A


114it [00:04, 23.25it/s][A[A[A


117it [00:05, 22.72it/s][A[A[A


120it [00:05, 22.95it/s][A[A[A


123it [00:05, 23.08it/s][A[A[A


126it [00:05, 23.11it/s][A[A[A


129it [00:05, 22.83it/s][A[A[A


132it [00:05, 21.86it/s][A[A[A


135it [00:05, 22.04it/s][A[A[A


138it [00:06, 22.54it/s][A[A[A


141it [00:06, 22.94it/s][A[A[A


144it [00:06, 23.04it/s][A[A[A


147it [00:06, 23.19it/s][A[A[A


150it [00:06, 23.49it/s][A[A[A


153it [00:06, 22.88it/s][A[A[A


156it [00:06, 23.11it/s][A[A[A


159it [00:06, 23.25it/s][A[A[A


162it [00:07, 23.22it/s][A[A[A


165it [00:07, 23.21it/s][A[A[A


168it [00:07, 23.29it/s][A[A[A


171it [00:07, 23.12it/s][A[A[A


174it [00:07, 22.78it/s][A[A[A


177it [00:07, 22.82it/s][A[A[A


180it [00:07, 22.98it/s][A[A[A


183it [00:07, 23.14it/s][A[A[A


187it [00:08, 23.01it/s]


Epoch [23/100], Step [100/187], loss: 0.1695





105it [00:04, 22.44it/s][A[A[A


108it [00:04, 22.80it/s][A[A[A


111it [00:04, 22.68it/s][A[A[A


114it [00:04, 22.55it/s][A[A[A


117it [00:05, 22.86it/s][A[A[A


120it [00:05, 22.91it/s][A[A[A


123it [00:05, 23.05it/s][A[A[A


126it [00:05, 23.26it/s][A[A[A


129it [00:05, 22.99it/s][A[A[A


132it [00:05, 23.11it/s][A[A[A


135it [00:05, 23.37it/s][A[A[A


138it [00:05, 23.48it/s][A[A[A


141it [00:06, 23.50it/s][A[A[A


144it [00:06, 23.48it/s][A[A[A


147it [00:06, 22.64it/s][A[A[A


150it [00:06, 22.69it/s][A[A[A


153it [00:06, 22.47it/s][A[A[A


156it [00:06, 22.65it/s][A[A[A


159it [00:06, 22.88it/s][A[A[A


162it [00:07, 23.07it/s][A[A[A


165it [00:07, 23.26it/s][A[A[A


168it [00:07, 22.77it/s][A[A[A


171it [00:07, 23.01it/s][A[A[A


174it [00:07, 22.97it/s][A[A[A


177it [00:07, 22.87it/s][A[A[A


180it [00:07, 23.00it/s][A[A[A


183it [00:07, 22.61it/s][A[A[A


187it [00:08, 23.03it/s]


Epoch [24/100], Step [100/187], loss: 0.8007





105it [00:04, 22.83it/s][A[A[A


108it [00:04, 22.57it/s][A[A[A


111it [00:04, 22.82it/s][A[A[A


114it [00:04, 23.06it/s][A[A[A


117it [00:05, 23.10it/s][A[A[A


120it [00:05, 23.16it/s][A[A[A


123it [00:05, 23.24it/s][A[A[A


126it [00:05, 22.90it/s][A[A[A


129it [00:05, 22.72it/s][A[A[A


132it [00:05, 22.91it/s][A[A[A


135it [00:05, 23.04it/s][A[A[A


138it [00:05, 23.33it/s][A[A[A


141it [00:06, 23.47it/s][A[A[A


144it [00:06, 23.49it/s][A[A[A


147it [00:06, 23.59it/s][A[A[A


150it [00:06, 23.63it/s][A[A[A


153it [00:06, 23.24it/s][A[A[A


156it [00:06, 23.36it/s][A[A[A


159it [00:06, 23.34it/s][A[A[A


162it [00:06, 22.87it/s][A[A[A


165it [00:07, 23.14it/s][A[A[A


168it [00:07, 23.24it/s][A[A[A


171it [00:07, 23.41it/s][A[A[A


174it [00:07, 23.34it/s][A[A[A


177it [00:07, 23.25it/s][A[A[A


180it [00:07, 23.47it/s][A[A[A


183it [00:07, 23.60it/s][A[A[A


187it [00:08, 23.19it/s]


Epoch [25/100], Step [100/187], loss: 0.0795





105it [00:04, 22.67it/s][A[A[A


108it [00:04, 23.05it/s][A[A[A


111it [00:04, 23.24it/s][A[A[A


114it [00:04, 23.23it/s][A[A[A


117it [00:05, 23.56it/s][A[A[A


120it [00:05, 23.58it/s][A[A[A


123it [00:05, 23.37it/s][A[A[A


126it [00:05, 23.43it/s][A[A[A


129it [00:05, 23.07it/s][A[A[A


132it [00:05, 23.29it/s][A[A[A


135it [00:05, 23.37it/s][A[A[A


138it [00:05, 23.15it/s][A[A[A


141it [00:06, 23.17it/s][A[A[A


144it [00:06, 23.43it/s][A[A[A


147it [00:06, 23.03it/s][A[A[A


150it [00:06, 23.02it/s][A[A[A


153it [00:06, 23.01it/s][A[A[A


156it [00:06, 23.22it/s][A[A[A


159it [00:06, 23.38it/s][A[A[A


162it [00:06, 23.48it/s][A[A[A


165it [00:07, 23.21it/s][A[A[A


168it [00:07, 23.23it/s][A[A[A


171it [00:07, 23.25it/s][A[A[A


174it [00:07, 23.03it/s][A[A[A


177it [00:07, 22.38it/s][A[A[A


180it [00:07, 22.42it/s][A[A[A


183it [00:07, 22.79it/s][A[A[A


187it [00:08, 23.18it/s]


Epoch [26/100], Step [100/187], loss: 0.6449





105it [00:04, 22.12it/s][A[A[A


108it [00:04, 22.61it/s][A[A[A


111it [00:04, 22.94it/s][A[A[A


114it [00:04, 23.05it/s][A[A[A


117it [00:05, 23.11it/s][A[A[A


120it [00:05, 23.27it/s][A[A[A


123it [00:05, 23.25it/s][A[A[A


126it [00:05, 23.10it/s][A[A[A


129it [00:05, 22.85it/s][A[A[A


132it [00:05, 22.87it/s][A[A[A


135it [00:05, 22.67it/s][A[A[A


138it [00:06, 22.96it/s][A[A[A


141it [00:06, 23.05it/s][A[A[A


144it [00:06, 22.53it/s][A[A[A


147it [00:06, 22.68it/s][A[A[A


150it [00:06, 22.52it/s][A[A[A


153it [00:06, 22.63it/s][A[A[A


156it [00:06, 22.95it/s][A[A[A


159it [00:06, 23.08it/s][A[A[A


162it [00:07, 23.31it/s][A[A[A


165it [00:07, 23.44it/s][A[A[A


168it [00:07, 23.32it/s][A[A[A


171it [00:07, 23.53it/s][A[A[A


174it [00:07, 23.38it/s][A[A[A


177it [00:07, 23.11it/s][A[A[A


180it [00:07, 23.35it/s][A[A[A


183it [00:07, 23.41it/s][A[A[A


187it [00:08, 22.97it/s]


Epoch [27/100], Step [100/187], loss: 1.5252





105it [00:04, 22.47it/s][A[A[A


108it [00:04, 22.89it/s][A[A[A


111it [00:04, 22.84it/s][A[A[A


114it [00:04, 22.78it/s][A[A[A


117it [00:05, 22.74it/s][A[A[A


120it [00:05, 22.20it/s][A[A[A


123it [00:05, 22.24it/s][A[A[A


126it [00:05, 22.57it/s][A[A[A


129it [00:05, 22.30it/s][A[A[A


132it [00:05, 22.61it/s][A[A[A


135it [00:05, 22.75it/s][A[A[A


138it [00:05, 22.52it/s][A[A[A


141it [00:06, 22.88it/s][A[A[A


144it [00:06, 22.77it/s][A[A[A


147it [00:06, 23.09it/s][A[A[A


150it [00:06, 22.29it/s][A[A[A


153it [00:06, 22.46it/s][A[A[A


156it [00:06, 22.67it/s][A[A[A


159it [00:06, 22.92it/s][A[A[A


162it [00:07, 22.95it/s][A[A[A


165it [00:07, 23.03it/s][A[A[A


168it [00:07, 23.19it/s][A[A[A


171it [00:07, 23.12it/s][A[A[A


174it [00:07, 22.94it/s][A[A[A


177it [00:07, 22.56it/s][A[A[A


180it [00:07, 22.38it/s][A[A[A


183it [00:07, 22.32it/s][A[A[A


187it [00:08, 22.96it/s]


Epoch [28/100], Step [100/187], loss: 0.9327





105it [00:04, 22.63it/s][A[A[A


108it [00:04, 22.87it/s][A[A[A


111it [00:04, 22.94it/s][A[A[A


114it [00:04, 22.82it/s][A[A[A


117it [00:05, 22.67it/s][A[A[A


120it [00:05, 22.91it/s][A[A[A


123it [00:05, 22.88it/s][A[A[A


126it [00:05, 22.66it/s][A[A[A


129it [00:05, 22.90it/s][A[A[A


132it [00:05, 22.98it/s][A[A[A


135it [00:05, 23.21it/s][A[A[A


138it [00:05, 23.42it/s][A[A[A


141it [00:06, 23.21it/s][A[A[A


144it [00:06, 23.38it/s][A[A[A


147it [00:06, 23.62it/s][A[A[A


150it [00:06, 23.11it/s][A[A[A


153it [00:06, 23.22it/s][A[A[A


156it [00:06, 23.29it/s][A[A[A


159it [00:06, 23.27it/s][A[A[A


162it [00:07, 23.38it/s][A[A[A


165it [00:07, 23.43it/s][A[A[A


168it [00:07, 22.90it/s][A[A[A


171it [00:07, 23.01it/s][A[A[A


174it [00:07, 22.73it/s][A[A[A


177it [00:07, 22.78it/s][A[A[A


180it [00:07, 23.02it/s][A[A[A


183it [00:07, 23.17it/s][A[A[A


187it [00:08, 23.08it/s]


Epoch [29/100], Step [100/187], loss: 0.0417





107it [00:04, 21.76it/s][A[A[A


110it [00:04, 22.22it/s][A[A[A


113it [00:04, 22.51it/s][A[A[A


116it [00:05, 22.91it/s][A[A[A


119it [00:05, 22.96it/s][A[A[A


122it [00:05, 23.04it/s][A[A[A


125it [00:05, 22.77it/s][A[A[A


128it [00:05, 22.81it/s][A[A[A


131it [00:05, 23.06it/s][A[A[A


134it [00:05, 23.21it/s][A[A[A


137it [00:05, 23.17it/s][A[A[A


140it [00:06, 23.18it/s][A[A[A


143it [00:06, 23.14it/s][A[A[A


146it [00:06, 23.02it/s][A[A[A


149it [00:06, 22.79it/s][A[A[A


152it [00:06, 22.43it/s][A[A[A


155it [00:06, 22.68it/s][A[A[A


158it [00:06, 22.93it/s][A[A[A


161it [00:07, 22.86it/s][A[A[A


164it [00:07, 23.04it/s][A[A[A


167it [00:07, 23.17it/s][A[A[A


170it [00:07, 22.99it/s][A[A[A


173it [00:07, 23.13it/s][A[A[A


176it [00:07, 23.16it/s][A[A[A


179it [00:07, 23.33it/s][A[A[A


182it [00:07, 23.30it/s][A[A[A


187it [00:08, 22.92it/s]



0it [00:00, ?it/s][A[A[A


3it

Epoch [30/100], Step [100/187], loss: 0.6319





105it [00:04, 22.40it/s][A[A[A


108it [00:04, 22.83it/s][A[A[A


111it [00:04, 22.68it/s][A[A[A


114it [00:04, 22.77it/s][A[A[A


117it [00:05, 22.90it/s][A[A[A


120it [00:05, 23.02it/s][A[A[A


123it [00:05, 23.07it/s][A[A[A


126it [00:05, 23.42it/s][A[A[A


129it [00:05, 23.51it/s][A[A[A


132it [00:05, 23.73it/s][A[A[A


135it [00:05, 23.69it/s][A[A[A


138it [00:05, 23.69it/s][A[A[A


141it [00:06, 22.98it/s][A[A[A


144it [00:06, 23.16it/s][A[A[A


147it [00:06, 23.11it/s][A[A[A


150it [00:06, 23.18it/s][A[A[A


153it [00:06, 23.35it/s][A[A[A


156it [00:06, 23.55it/s][A[A[A


159it [00:06, 23.32it/s][A[A[A


162it [00:07, 23.39it/s][A[A[A


165it [00:07, 23.30it/s][A[A[A


168it [00:07, 23.22it/s][A[A[A


171it [00:07, 22.85it/s][A[A[A


174it [00:07, 22.97it/s][A[A[A


177it [00:07, 23.22it/s][A[A[A


180it [00:07, 23.43it/s][A[A[A


183it [00:07, 23.23it/s][A[A[A


187it [00:08, 23.03it/s]


Epoch [31/100], Step [100/187], loss: 0.2642





105it [00:04, 22.65it/s][A[A[A


108it [00:04, 22.80it/s][A[A[A


111it [00:04, 22.63it/s][A[A[A


114it [00:04, 22.95it/s][A[A[A


117it [00:05, 22.91it/s][A[A[A


120it [00:05, 22.64it/s][A[A[A


123it [00:05, 21.94it/s][A[A[A


126it [00:05, 21.27it/s][A[A[A


129it [00:05, 21.86it/s][A[A[A


132it [00:05, 22.36it/s][A[A[A


135it [00:05, 22.60it/s][A[A[A


138it [00:06, 22.70it/s][A[A[A


141it [00:06, 22.92it/s][A[A[A


144it [00:06, 23.06it/s][A[A[A


147it [00:06, 23.12it/s][A[A[A


150it [00:06, 23.24it/s][A[A[A


153it [00:06, 23.44it/s][A[A[A


156it [00:06, 23.31it/s][A[A[A


159it [00:06, 23.10it/s][A[A[A


162it [00:07, 23.29it/s][A[A[A


165it [00:07, 23.38it/s][A[A[A


168it [00:07, 23.21it/s][A[A[A


171it [00:07, 23.37it/s][A[A[A


174it [00:07, 23.62it/s][A[A[A


177it [00:07, 23.37it/s][A[A[A


180it [00:07, 23.40it/s][A[A[A


183it [00:07, 23.34it/s][A[A[A


187it [00:08, 22.94it/s]


Epoch [32/100], Step [100/187], loss: 0.1414





105it [00:04, 22.55it/s][A[A[A


108it [00:04, 22.90it/s][A[A[A


111it [00:04, 22.96it/s][A[A[A


114it [00:04, 22.90it/s][A[A[A


117it [00:05, 22.98it/s][A[A[A


120it [00:05, 22.95it/s][A[A[A


123it [00:05, 23.04it/s][A[A[A


126it [00:05, 22.97it/s][A[A[A


129it [00:05, 23.24it/s][A[A[A


132it [00:05, 23.31it/s][A[A[A


135it [00:05, 23.49it/s][A[A[A


138it [00:06, 23.59it/s][A[A[A


141it [00:06, 23.46it/s][A[A[A


144it [00:06, 23.39it/s][A[A[A


147it [00:06, 23.49it/s][A[A[A


150it [00:06, 23.37it/s][A[A[A


153it [00:06, 23.40it/s][A[A[A


156it [00:06, 23.53it/s][A[A[A


159it [00:06, 23.36it/s][A[A[A


162it [00:07, 23.41it/s][A[A[A


165it [00:07, 23.50it/s][A[A[A


168it [00:07, 23.10it/s][A[A[A


171it [00:07, 23.35it/s][A[A[A


174it [00:07, 22.64it/s][A[A[A


177it [00:07, 22.71it/s][A[A[A


180it [00:07, 23.07it/s][A[A[A


183it [00:07, 23.36it/s][A[A[A


187it [00:08, 23.05it/s]


Epoch [33/100], Step [100/187], loss: 0.1285





105it [00:04, 22.62it/s][A[A[A


108it [00:04, 22.93it/s][A[A[A


111it [00:04, 23.23it/s][A[A[A


114it [00:04, 23.26it/s][A[A[A


117it [00:05, 23.24it/s][A[A[A


120it [00:05, 22.70it/s][A[A[A


123it [00:05, 22.59it/s][A[A[A


126it [00:05, 22.79it/s][A[A[A


129it [00:05, 23.00it/s][A[A[A


132it [00:05, 23.11it/s][A[A[A


135it [00:05, 23.26it/s][A[A[A


138it [00:05, 23.49it/s][A[A[A


141it [00:06, 23.42it/s][A[A[A


144it [00:06, 23.59it/s][A[A[A


147it [00:06, 23.49it/s][A[A[A


150it [00:06, 23.39it/s][A[A[A


153it [00:06, 23.52it/s][A[A[A


156it [00:06, 23.55it/s][A[A[A


159it [00:06, 23.26it/s][A[A[A


162it [00:06, 23.43it/s][A[A[A


165it [00:07, 23.58it/s][A[A[A


168it [00:07, 23.55it/s][A[A[A


171it [00:07, 22.84it/s][A[A[A


174it [00:07, 23.01it/s][A[A[A


177it [00:07, 22.66it/s][A[A[A


180it [00:07, 22.88it/s][A[A[A


183it [00:07, 23.13it/s][A[A[A


187it [00:08, 23.24it/s]


Epoch [34/100], Step [100/187], loss: 1.1529





105it [00:04, 22.75it/s][A[A[A


108it [00:04, 23.14it/s][A[A[A


111it [00:04, 22.93it/s][A[A[A


114it [00:04, 23.05it/s][A[A[A


117it [00:05, 23.09it/s][A[A[A


120it [00:05, 22.97it/s][A[A[A


123it [00:05, 22.93it/s][A[A[A


126it [00:05, 23.06it/s][A[A[A


129it [00:05, 23.19it/s][A[A[A


132it [00:05, 23.25it/s][A[A[A


135it [00:05, 23.17it/s][A[A[A


138it [00:05, 22.96it/s][A[A[A


141it [00:06, 23.25it/s][A[A[A


144it [00:06, 23.26it/s][A[A[A


147it [00:06, 23.21it/s][A[A[A


150it [00:06, 23.26it/s][A[A[A


153it [00:06, 23.27it/s][A[A[A


156it [00:06, 23.32it/s][A[A[A


159it [00:06, 23.41it/s][A[A[A


162it [00:06, 23.01it/s][A[A[A


165it [00:07, 22.90it/s][A[A[A


168it [00:07, 23.26it/s][A[A[A


171it [00:07, 22.97it/s][A[A[A


174it [00:07, 23.15it/s][A[A[A


177it [00:07, 23.47it/s][A[A[A


180it [00:07, 23.31it/s][A[A[A


183it [00:07, 23.32it/s][A[A[A


187it [00:08, 23.20it/s]


Epoch [35/100], Step [100/187], loss: 0.8019





105it [00:04, 22.22it/s][A[A[A


108it [00:04, 22.70it/s][A[A[A


111it [00:04, 22.71it/s][A[A[A


114it [00:04, 22.81it/s][A[A[A


117it [00:05, 23.14it/s][A[A[A


120it [00:05, 23.15it/s][A[A[A


123it [00:05, 23.06it/s][A[A[A


126it [00:05, 23.16it/s][A[A[A


129it [00:05, 22.83it/s][A[A[A


132it [00:05, 22.94it/s][A[A[A


135it [00:05, 22.97it/s][A[A[A


138it [00:06, 22.74it/s][A[A[A


141it [00:06, 22.33it/s][A[A[A


144it [00:06, 22.26it/s][A[A[A


147it [00:06, 22.48it/s][A[A[A


150it [00:06, 21.92it/s][A[A[A


153it [00:06, 22.01it/s][A[A[A


156it [00:06, 22.45it/s][A[A[A


159it [00:06, 22.74it/s][A[A[A


162it [00:07, 22.22it/s][A[A[A


165it [00:07, 22.53it/s][A[A[A


168it [00:07, 22.36it/s][A[A[A


171it [00:07, 22.58it/s][A[A[A


174it [00:07, 22.63it/s][A[A[A


177it [00:07, 22.69it/s][A[A[A


180it [00:07, 22.49it/s][A[A[A


183it [00:08, 22.59it/s][A[A[A


187it [00:08, 22.72it/s]


Epoch [36/100], Step [100/187], loss: 1.1002





105it [00:04, 22.00it/s][A[A[A


108it [00:04, 22.40it/s][A[A[A


111it [00:04, 22.74it/s][A[A[A


114it [00:05, 22.94it/s][A[A[A


117it [00:05, 22.74it/s][A[A[A


120it [00:05, 22.93it/s][A[A[A


123it [00:05, 22.74it/s][A[A[A


126it [00:05, 23.00it/s][A[A[A


129it [00:05, 23.02it/s][A[A[A


132it [00:05, 23.14it/s][A[A[A


135it [00:05, 23.20it/s][A[A[A


138it [00:06, 22.37it/s][A[A[A


141it [00:06, 22.09it/s][A[A[A


144it [00:06, 22.43it/s][A[A[A


147it [00:06, 22.79it/s][A[A[A


150it [00:06, 22.80it/s][A[A[A


153it [00:06, 22.93it/s][A[A[A


156it [00:06, 23.07it/s][A[A[A


159it [00:07, 22.98it/s][A[A[A


162it [00:07, 23.14it/s][A[A[A


165it [00:07, 22.98it/s][A[A[A


168it [00:07, 22.90it/s][A[A[A


171it [00:07, 23.12it/s][A[A[A


174it [00:07, 23.33it/s][A[A[A


177it [00:07, 23.22it/s][A[A[A


180it [00:07, 23.44it/s][A[A[A


183it [00:08, 23.47it/s][A[A[A


187it [00:08, 22.68it/s]


Epoch [37/100], Step [100/187], loss: 0.0344





105it [00:04, 22.27it/s][A[A[A


108it [00:04, 22.35it/s][A[A[A


111it [00:04, 22.71it/s][A[A[A


114it [00:04, 22.95it/s][A[A[A


117it [00:05, 23.11it/s][A[A[A


120it [00:05, 23.23it/s][A[A[A


123it [00:05, 23.39it/s][A[A[A


126it [00:05, 23.55it/s][A[A[A


129it [00:05, 23.46it/s][A[A[A


132it [00:05, 23.55it/s][A[A[A


135it [00:05, 23.58it/s][A[A[A


138it [00:05, 23.44it/s][A[A[A


141it [00:06, 23.21it/s][A[A[A


144it [00:06, 23.09it/s][A[A[A


147it [00:06, 23.17it/s][A[A[A


150it [00:06, 23.08it/s][A[A[A


153it [00:06, 22.64it/s][A[A[A


156it [00:06, 22.86it/s][A[A[A


159it [00:06, 23.11it/s][A[A[A


162it [00:06, 23.11it/s][A[A[A


165it [00:07, 22.99it/s][A[A[A


168it [00:07, 23.30it/s][A[A[A


171it [00:07, 23.28it/s][A[A[A


174it [00:07, 23.44it/s][A[A[A


177it [00:07, 23.58it/s][A[A[A


180it [00:07, 23.54it/s][A[A[A


183it [00:07, 23.62it/s][A[A[A


187it [00:08, 23.18it/s]


Epoch [38/100], Step [100/187], loss: 0.0295





107it [00:04, 22.50it/s][A[A[A


110it [00:04, 22.80it/s][A[A[A


113it [00:04, 22.97it/s][A[A[A


116it [00:05, 23.02it/s][A[A[A


119it [00:05, 23.13it/s][A[A[A


122it [00:05, 23.36it/s][A[A[A


125it [00:05, 23.67it/s][A[A[A


128it [00:05, 23.75it/s][A[A[A


131it [00:05, 23.91it/s][A[A[A


134it [00:05, 23.93it/s][A[A[A


137it [00:05, 23.80it/s][A[A[A


140it [00:06, 23.77it/s][A[A[A


143it [00:06, 23.67it/s][A[A[A


146it [00:06, 23.34it/s][A[A[A


149it [00:06, 22.96it/s][A[A[A


152it [00:06, 23.18it/s][A[A[A


155it [00:06, 23.38it/s][A[A[A


158it [00:06, 23.25it/s][A[A[A


161it [00:06, 23.34it/s][A[A[A


164it [00:07, 22.89it/s][A[A[A


167it [00:07, 23.04it/s][A[A[A


170it [00:07, 23.33it/s][A[A[A


173it [00:07, 23.35it/s][A[A[A


176it [00:07, 23.56it/s][A[A[A


179it [00:07, 23.63it/s][A[A[A


182it [00:07, 23.42it/s][A[A[A


187it [00:08, 23.25it/s]



0it [00:00, ?it/s][A[A[A


3it

Epoch [39/100], Step [100/187], loss: 0.0453





107it [00:04, 22.60it/s][A[A[A


110it [00:04, 22.87it/s][A[A[A


113it [00:04, 22.90it/s][A[A[A


116it [00:05, 22.79it/s][A[A[A


119it [00:05, 23.02it/s][A[A[A


122it [00:05, 23.31it/s][A[A[A


125it [00:05, 23.22it/s][A[A[A


128it [00:05, 23.11it/s][A[A[A


131it [00:05, 23.39it/s][A[A[A


134it [00:05, 23.36it/s][A[A[A


137it [00:05, 23.52it/s][A[A[A


140it [00:06, 23.03it/s][A[A[A


143it [00:06, 23.26it/s][A[A[A


146it [00:06, 23.42it/s][A[A[A


149it [00:06, 22.88it/s][A[A[A


152it [00:06, 23.02it/s][A[A[A


155it [00:06, 23.18it/s][A[A[A


158it [00:06, 23.23it/s][A[A[A


161it [00:07, 23.16it/s][A[A[A


164it [00:07, 23.05it/s][A[A[A


167it [00:07, 23.12it/s][A[A[A


170it [00:07, 23.27it/s][A[A[A


173it [00:07, 22.99it/s][A[A[A


176it [00:07, 23.12it/s][A[A[A


179it [00:07, 22.38it/s][A[A[A


182it [00:07, 22.09it/s][A[A[A


187it [00:08, 22.89it/s]



0it [00:00, ?it/s][A[A[A


3it

Epoch [40/100], Step [100/187], loss: 0.3249





105it [00:04, 22.97it/s][A[A[A


108it [00:04, 22.90it/s][A[A[A


111it [00:04, 23.09it/s][A[A[A


114it [00:04, 23.33it/s][A[A[A


117it [00:05, 22.71it/s][A[A[A


120it [00:05, 22.93it/s][A[A[A


123it [00:05, 22.73it/s][A[A[A


126it [00:05, 22.77it/s][A[A[A


129it [00:05, 22.48it/s][A[A[A


132it [00:05, 22.61it/s][A[A[A


135it [00:05, 22.88it/s][A[A[A


138it [00:05, 23.05it/s][A[A[A


141it [00:06, 22.63it/s][A[A[A


144it [00:06, 22.92it/s][A[A[A


147it [00:06, 23.09it/s][A[A[A


150it [00:06, 23.08it/s][A[A[A


153it [00:06, 23.14it/s][A[A[A


156it [00:06, 23.09it/s][A[A[A


159it [00:06, 22.72it/s][A[A[A


162it [00:07, 22.69it/s][A[A[A


165it [00:07, 23.02it/s][A[A[A


168it [00:07, 23.14it/s][A[A[A


171it [00:07, 23.35it/s][A[A[A


174it [00:07, 23.62it/s][A[A[A


177it [00:07, 23.59it/s][A[A[A


180it [00:07, 23.66it/s][A[A[A


183it [00:07, 23.75it/s][A[A[A


187it [00:08, 23.12it/s]


Epoch [41/100], Step [100/187], loss: 0.2037





105it [00:04, 22.56it/s][A[A[A


108it [00:04, 22.89it/s][A[A[A


111it [00:04, 22.64it/s][A[A[A


114it [00:04, 22.95it/s][A[A[A


117it [00:05, 23.09it/s][A[A[A


120it [00:05, 23.17it/s][A[A[A


123it [00:05, 23.31it/s][A[A[A


126it [00:05, 23.42it/s][A[A[A


129it [00:05, 23.32it/s][A[A[A


132it [00:05, 22.87it/s][A[A[A


135it [00:05, 22.67it/s][A[A[A


138it [00:06, 22.13it/s][A[A[A


141it [00:06, 22.31it/s][A[A[A


144it [00:06, 22.09it/s][A[A[A


147it [00:06, 22.11it/s][A[A[A


150it [00:06, 22.47it/s][A[A[A


153it [00:06, 22.18it/s][A[A[A


156it [00:06, 22.26it/s][A[A[A


159it [00:06, 22.31it/s][A[A[A


162it [00:07, 22.30it/s][A[A[A


165it [00:07, 22.75it/s][A[A[A


168it [00:07, 22.87it/s][A[A[A


171it [00:07, 23.29it/s][A[A[A


174it [00:07, 23.15it/s][A[A[A


177it [00:07, 23.03it/s][A[A[A


180it [00:07, 22.49it/s][A[A[A


183it [00:08, 22.56it/s][A[A[A


187it [00:08, 22.75it/s]


Epoch [42/100], Step [100/187], loss: 0.0921





107it [00:04, 22.68it/s][A[A[A


110it [00:04, 22.98it/s][A[A[A


113it [00:04, 22.95it/s][A[A[A


116it [00:05, 23.10it/s][A[A[A


119it [00:05, 23.31it/s][A[A[A


122it [00:05, 23.33it/s][A[A[A


125it [00:05, 23.26it/s][A[A[A


128it [00:05, 23.38it/s][A[A[A


131it [00:05, 23.42it/s][A[A[A


134it [00:05, 22.99it/s][A[A[A


137it [00:05, 22.87it/s][A[A[A


140it [00:06, 22.98it/s][A[A[A


143it [00:06, 22.77it/s][A[A[A


146it [00:06, 22.97it/s][A[A[A


149it [00:06, 23.22it/s][A[A[A


152it [00:06, 22.91it/s][A[A[A


155it [00:06, 23.06it/s][A[A[A


158it [00:06, 23.30it/s][A[A[A


161it [00:06, 23.22it/s][A[A[A


164it [00:07, 23.03it/s][A[A[A


167it [00:07, 23.26it/s][A[A[A


170it [00:07, 23.18it/s][A[A[A


173it [00:07, 23.11it/s][A[A[A


176it [00:07, 23.33it/s][A[A[A


179it [00:07, 23.38it/s][A[A[A


182it [00:07, 23.30it/s][A[A[A


187it [00:08, 23.05it/s]



0it [00:00, ?it/s][A[A[A


3it

Epoch [43/100], Step [100/187], loss: 0.3045





107it [00:04, 22.26it/s][A[A[A


110it [00:04, 22.64it/s][A[A[A


113it [00:04, 22.39it/s][A[A[A


116it [00:05, 22.70it/s][A[A[A


119it [00:05, 22.66it/s][A[A[A


122it [00:05, 22.82it/s][A[A[A


125it [00:05, 23.11it/s][A[A[A


128it [00:05, 23.19it/s][A[A[A


131it [00:05, 23.35it/s][A[A[A


134it [00:05, 23.53it/s][A[A[A


137it [00:05, 23.38it/s][A[A[A


140it [00:06, 23.49it/s][A[A[A


143it [00:06, 23.67it/s][A[A[A


146it [00:06, 23.42it/s][A[A[A


149it [00:06, 23.53it/s][A[A[A


152it [00:06, 23.54it/s][A[A[A


155it [00:06, 23.44it/s][A[A[A


158it [00:06, 23.33it/s][A[A[A


161it [00:06, 23.02it/s][A[A[A


164it [00:07, 22.65it/s][A[A[A


167it [00:07, 23.12it/s][A[A[A


170it [00:07, 23.12it/s][A[A[A


173it [00:07, 23.18it/s][A[A[A


176it [00:07, 23.21it/s][A[A[A


179it [00:07, 23.22it/s][A[A[A


182it [00:07, 22.96it/s][A[A[A


187it [00:08, 23.03it/s]



0it [00:00, ?it/s][A[A[A


3it

Epoch [44/100], Step [100/187], loss: 0.1292





105it [00:04, 22.17it/s][A[A[A


108it [00:04, 22.43it/s][A[A[A


111it [00:04, 22.02it/s][A[A[A


114it [00:04, 22.29it/s][A[A[A


117it [00:05, 22.82it/s][A[A[A


120it [00:05, 22.76it/s][A[A[A


123it [00:05, 23.01it/s][A[A[A


126it [00:05, 23.17it/s][A[A[A


129it [00:05, 23.13it/s][A[A[A


132it [00:05, 23.08it/s][A[A[A


135it [00:05, 22.99it/s][A[A[A


138it [00:05, 22.92it/s][A[A[A


141it [00:06, 23.12it/s][A[A[A


144it [00:06, 22.92it/s][A[A[A


147it [00:06, 22.85it/s][A[A[A


150it [00:06, 22.95it/s][A[A[A


153it [00:06, 22.86it/s][A[A[A


156it [00:06, 23.15it/s][A[A[A


159it [00:06, 23.13it/s][A[A[A


162it [00:07, 22.77it/s][A[A[A


165it [00:07, 23.03it/s][A[A[A


168it [00:07, 23.07it/s][A[A[A


171it [00:07, 23.21it/s][A[A[A


174it [00:07, 23.39it/s][A[A[A


177it [00:07, 23.42it/s][A[A[A


180it [00:07, 23.36it/s][A[A[A


183it [00:07, 23.22it/s][A[A[A


187it [00:08, 23.09it/s]


Epoch [45/100], Step [100/187], loss: 0.0166





105it [00:04, 21.62it/s][A[A[A


108it [00:04, 22.08it/s][A[A[A


111it [00:04, 21.55it/s][A[A[A


114it [00:05, 21.83it/s][A[A[A


117it [00:05, 22.13it/s][A[A[A


120it [00:05, 22.38it/s][A[A[A


123it [00:05, 22.50it/s][A[A[A


126it [00:05, 22.52it/s][A[A[A


129it [00:05, 22.62it/s][A[A[A


132it [00:05, 22.51it/s][A[A[A


135it [00:05, 22.44it/s][A[A[A


138it [00:06, 22.51it/s][A[A[A


141it [00:06, 22.52it/s][A[A[A


144it [00:06, 22.07it/s][A[A[A


147it [00:06, 21.46it/s][A[A[A


150it [00:06, 21.83it/s][A[A[A


153it [00:06, 21.68it/s][A[A[A


156it [00:06, 21.72it/s][A[A[A


159it [00:07, 21.85it/s][A[A[A


162it [00:07, 22.27it/s][A[A[A


165it [00:07, 22.61it/s][A[A[A


168it [00:07, 22.67it/s][A[A[A


171it [00:07, 22.43it/s][A[A[A


174it [00:07, 22.42it/s][A[A[A


177it [00:07, 22.18it/s][A[A[A


180it [00:08, 22.51it/s][A[A[A


183it [00:08, 22.67it/s][A[A[A


187it [00:08, 22.42it/s]


Epoch [46/100], Step [100/187], loss: 1.3192





105it [00:04, 21.32it/s][A[A[A


108it [00:04, 21.64it/s][A[A[A


111it [00:04, 22.00it/s][A[A[A


114it [00:05, 22.50it/s][A[A[A


117it [00:05, 22.87it/s][A[A[A


120it [00:05, 22.97it/s][A[A[A


123it [00:05, 23.20it/s][A[A[A


126it [00:05, 22.82it/s][A[A[A


129it [00:05, 22.49it/s][A[A[A


132it [00:05, 22.73it/s][A[A[A


135it [00:06, 22.73it/s][A[A[A


138it [00:06, 22.93it/s][A[A[A


141it [00:06, 22.95it/s][A[A[A


144it [00:06, 23.09it/s][A[A[A


147it [00:06, 23.22it/s][A[A[A


150it [00:06, 23.16it/s][A[A[A


153it [00:06, 23.15it/s][A[A[A


156it [00:06, 23.12it/s][A[A[A


159it [00:07, 23.30it/s][A[A[A


162it [00:07, 22.99it/s][A[A[A


165it [00:07, 23.13it/s][A[A[A


168it [00:07, 23.37it/s][A[A[A


171it [00:07, 22.82it/s][A[A[A


174it [00:07, 22.65it/s][A[A[A


177it [00:07, 22.97it/s][A[A[A


180it [00:07, 23.12it/s][A[A[A


183it [00:08, 23.20it/s][A[A[A


187it [00:08, 22.56it/s]


Epoch [47/100], Step [100/187], loss: 0.0156





105it [00:04, 22.45it/s][A[A[A


108it [00:04, 22.92it/s][A[A[A


111it [00:04, 23.18it/s][A[A[A


114it [00:05, 23.02it/s][A[A[A


117it [00:05, 23.26it/s][A[A[A


120it [00:05, 23.22it/s][A[A[A


123it [00:05, 22.97it/s][A[A[A


126it [00:05, 23.14it/s][A[A[A


129it [00:05, 23.37it/s][A[A[A


132it [00:05, 23.47it/s][A[A[A


135it [00:05, 23.68it/s][A[A[A


138it [00:06, 23.49it/s][A[A[A


141it [00:06, 23.64it/s][A[A[A


144it [00:06, 23.78it/s][A[A[A


147it [00:06, 23.36it/s][A[A[A


150it [00:06, 23.38it/s][A[A[A


153it [00:06, 23.08it/s][A[A[A


156it [00:06, 22.77it/s][A[A[A


159it [00:06, 22.71it/s][A[A[A


162it [00:07, 22.84it/s][A[A[A


165it [00:07, 23.15it/s][A[A[A


168it [00:07, 23.27it/s][A[A[A


171it [00:07, 22.70it/s][A[A[A


174it [00:07, 23.06it/s][A[A[A


177it [00:07, 23.20it/s][A[A[A


180it [00:07, 23.27it/s][A[A[A


183it [00:07, 23.39it/s][A[A[A


187it [00:08, 22.97it/s]


Epoch [48/100], Step [100/187], loss: 1.1144





105it [00:04, 22.62it/s][A[A[A


108it [00:04, 23.04it/s][A[A[A


111it [00:04, 23.30it/s][A[A[A


114it [00:04, 23.29it/s][A[A[A


117it [00:05, 23.53it/s][A[A[A


120it [00:05, 23.59it/s][A[A[A


123it [00:05, 23.38it/s][A[A[A


126it [00:05, 23.27it/s][A[A[A


129it [00:05, 23.49it/s][A[A[A


132it [00:05, 23.49it/s][A[A[A


135it [00:05, 23.78it/s][A[A[A


138it [00:05, 23.91it/s][A[A[A


141it [00:06, 23.50it/s][A[A[A


144it [00:06, 23.60it/s][A[A[A


147it [00:06, 23.71it/s][A[A[A


150it [00:06, 23.25it/s][A[A[A


153it [00:06, 23.52it/s][A[A[A


156it [00:06, 23.57it/s][A[A[A


159it [00:06, 23.66it/s][A[A[A


162it [00:06, 23.78it/s][A[A[A


165it [00:07, 23.76it/s][A[A[A


168it [00:07, 23.55it/s][A[A[A


171it [00:07, 23.45it/s][A[A[A


174it [00:07, 23.33it/s][A[A[A


177it [00:07, 23.41it/s][A[A[A


180it [00:07, 23.56it/s][A[A[A


183it [00:07, 23.74it/s][A[A[A


187it [00:08, 23.35it/s]


Epoch [49/100], Step [100/187], loss: 0.0610





105it [00:04, 22.42it/s][A[A[A


108it [00:04, 22.82it/s][A[A[A


111it [00:04, 23.11it/s][A[A[A


114it [00:04, 23.24it/s][A[A[A


117it [00:05, 22.89it/s][A[A[A


120it [00:05, 23.02it/s][A[A[A


123it [00:05, 23.31it/s][A[A[A


126it [00:05, 23.31it/s][A[A[A


129it [00:05, 22.71it/s][A[A[A


132it [00:05, 22.93it/s][A[A[A


135it [00:05, 23.16it/s][A[A[A


138it [00:05, 23.20it/s][A[A[A


141it [00:06, 23.40it/s][A[A[A


144it [00:06, 23.54it/s][A[A[A


147it [00:06, 23.40it/s][A[A[A


150it [00:06, 23.26it/s][A[A[A


153it [00:06, 23.37it/s][A[A[A


156it [00:06, 23.48it/s][A[A[A


159it [00:06, 23.34it/s][A[A[A


162it [00:06, 23.53it/s][A[A[A


165it [00:07, 23.69it/s][A[A[A


168it [00:07, 23.51it/s][A[A[A


171it [00:07, 23.08it/s][A[A[A


174it [00:07, 23.21it/s][A[A[A


177it [00:07, 22.92it/s][A[A[A


180it [00:07, 23.01it/s][A[A[A


183it [00:07, 23.26it/s][A[A[A


187it [00:08, 23.27it/s]


Epoch [50/100], Step [100/187], loss: 0.1144





105it [00:04, 22.45it/s][A[A[A


108it [00:04, 22.32it/s][A[A[A


111it [00:04, 22.14it/s][A[A[A


114it [00:04, 22.33it/s][A[A[A


117it [00:05, 22.72it/s][A[A[A


120it [00:05, 22.97it/s][A[A[A


123it [00:05, 23.23it/s][A[A[A


126it [00:05, 22.69it/s][A[A[A


129it [00:05, 22.68it/s][A[A[A


132it [00:05, 23.14it/s][A[A[A


135it [00:05, 23.45it/s][A[A[A


138it [00:05, 23.67it/s][A[A[A


141it [00:06, 22.90it/s][A[A[A


144it [00:06, 23.13it/s][A[A[A


147it [00:06, 23.14it/s][A[A[A


150it [00:06, 22.84it/s][A[A[A


153it [00:06, 23.15it/s][A[A[A


156it [00:06, 23.31it/s][A[A[A


159it [00:06, 23.39it/s][A[A[A


162it [00:07, 23.12it/s][A[A[A


165it [00:07, 22.48it/s][A[A[A


168it [00:07, 22.03it/s][A[A[A


171it [00:07, 22.40it/s][A[A[A


174it [00:07, 21.64it/s][A[A[A


177it [00:07, 22.18it/s][A[A[A


180it [00:07, 22.57it/s][A[A[A


183it [00:07, 22.89it/s][A[A[A


187it [00:08, 22.98it/s]


Epoch [51/100], Step [100/187], loss: 0.0925





105it [00:04, 22.41it/s][A[A[A


108it [00:04, 22.85it/s][A[A[A


111it [00:04, 23.13it/s][A[A[A


114it [00:04, 23.13it/s][A[A[A


117it [00:05, 23.28it/s][A[A[A


120it [00:05, 23.27it/s][A[A[A


123it [00:05, 23.35it/s][A[A[A


126it [00:05, 22.89it/s][A[A[A


129it [00:05, 23.14it/s][A[A[A


132it [00:05, 23.29it/s][A[A[A


135it [00:05, 22.95it/s][A[A[A


138it [00:05, 22.94it/s][A[A[A


141it [00:06, 23.13it/s][A[A[A


144it [00:06, 23.18it/s][A[A[A


147it [00:06, 23.05it/s][A[A[A


150it [00:06, 22.85it/s][A[A[A


153it [00:06, 23.12it/s][A[A[A


156it [00:06, 23.12it/s][A[A[A


159it [00:06, 23.25it/s][A[A[A


162it [00:07, 23.48it/s][A[A[A


165it [00:07, 23.33it/s][A[A[A


168it [00:07, 23.41it/s][A[A[A


171it [00:07, 23.43it/s][A[A[A


174it [00:07, 23.19it/s][A[A[A


177it [00:07, 23.28it/s][A[A[A


180it [00:07, 23.46it/s][A[A[A


183it [00:07, 23.29it/s][A[A[A


187it [00:08, 23.13it/s]


Epoch [52/100], Step [100/187], loss: 0.0416





105it [00:04, 22.50it/s][A[A[A


108it [00:04, 22.83it/s][A[A[A


111it [00:04, 23.04it/s][A[A[A


114it [00:04, 23.25it/s][A[A[A


117it [00:05, 23.23it/s][A[A[A


120it [00:05, 23.52it/s][A[A[A


123it [00:05, 23.62it/s][A[A[A


126it [00:05, 23.43it/s][A[A[A


129it [00:05, 23.61it/s][A[A[A


132it [00:05, 23.77it/s][A[A[A


135it [00:05, 23.92it/s][A[A[A


138it [00:05, 23.41it/s][A[A[A


141it [00:06, 23.56it/s][A[A[A


144it [00:06, 23.62it/s][A[A[A


147it [00:06, 23.52it/s][A[A[A


150it [00:06, 23.25it/s][A[A[A


153it [00:06, 23.32it/s][A[A[A


156it [00:06, 23.12it/s][A[A[A


159it [00:06, 23.31it/s][A[A[A


162it [00:06, 23.28it/s][A[A[A


165it [00:07, 23.32it/s][A[A[A


168it [00:07, 23.59it/s][A[A[A


171it [00:07, 23.44it/s][A[A[A


174it [00:07, 23.37it/s][A[A[A


177it [00:07, 23.50it/s][A[A[A


180it [00:07, 23.46it/s][A[A[A


183it [00:07, 23.62it/s][A[A[A


187it [00:08, 23.19it/s]


Epoch [53/100], Step [100/187], loss: 0.2339





105it [00:04, 22.60it/s][A[A[A


108it [00:04, 22.74it/s][A[A[A


111it [00:04, 23.03it/s][A[A[A


114it [00:04, 23.28it/s][A[A[A


117it [00:05, 23.33it/s][A[A[A


120it [00:05, 23.16it/s][A[A[A


123it [00:05, 23.00it/s][A[A[A


126it [00:05, 23.27it/s][A[A[A


129it [00:05, 22.99it/s][A[A[A


132it [00:05, 23.30it/s][A[A[A


135it [00:05, 22.97it/s][A[A[A


138it [00:05, 22.85it/s][A[A[A


141it [00:06, 22.84it/s][A[A[A


144it [00:06, 22.95it/s][A[A[A


147it [00:06, 23.22it/s][A[A[A


150it [00:06, 23.16it/s][A[A[A


153it [00:06, 23.20it/s][A[A[A


156it [00:06, 23.44it/s][A[A[A


159it [00:06, 23.02it/s][A[A[A


162it [00:07, 22.46it/s][A[A[A


165it [00:07, 22.68it/s][A[A[A


168it [00:07, 22.97it/s][A[A[A


171it [00:07, 23.08it/s][A[A[A


174it [00:07, 23.07it/s][A[A[A


177it [00:07, 23.39it/s][A[A[A


180it [00:07, 23.53it/s][A[A[A


183it [00:07, 23.59it/s][A[A[A


187it [00:08, 23.16it/s]


Epoch [54/100], Step [100/187], loss: 0.2119





105it [00:04, 22.53it/s][A[A[A


108it [00:04, 22.89it/s][A[A[A


111it [00:04, 23.15it/s][A[A[A


114it [00:04, 22.89it/s][A[A[A


117it [00:05, 22.99it/s][A[A[A


120it [00:05, 22.79it/s][A[A[A


123it [00:05, 22.88it/s][A[A[A


126it [00:05, 23.14it/s][A[A[A


129it [00:05, 22.67it/s][A[A[A


132it [00:05, 22.88it/s][A[A[A


135it [00:05, 23.04it/s][A[A[A


138it [00:05, 22.99it/s][A[A[A


141it [00:06, 22.50it/s][A[A[A


144it [00:06, 22.62it/s][A[A[A


147it [00:06, 22.82it/s][A[A[A


150it [00:06, 22.83it/s][A[A[A


153it [00:06, 23.04it/s][A[A[A


156it [00:06, 22.54it/s][A[A[A


159it [00:06, 22.72it/s][A[A[A


162it [00:07, 23.01it/s][A[A[A


165it [00:07, 23.08it/s][A[A[A


168it [00:07, 23.32it/s][A[A[A


171it [00:07, 23.38it/s][A[A[A


174it [00:07, 22.57it/s][A[A[A


177it [00:07, 22.66it/s][A[A[A


180it [00:07, 22.73it/s][A[A[A


183it [00:07, 22.89it/s][A[A[A


187it [00:08, 23.00it/s]


Epoch [55/100], Step [100/187], loss: 0.0626





105it [00:04, 21.90it/s][A[A[A


108it [00:04, 22.16it/s][A[A[A


111it [00:04, 22.49it/s][A[A[A


114it [00:04, 22.51it/s][A[A[A


117it [00:05, 22.65it/s][A[A[A


120it [00:05, 22.90it/s][A[A[A


123it [00:05, 22.94it/s][A[A[A


126it [00:05, 22.89it/s][A[A[A


129it [00:05, 23.13it/s][A[A[A


132it [00:05, 22.91it/s][A[A[A


135it [00:05, 23.07it/s][A[A[A


138it [00:06, 23.32it/s][A[A[A


141it [00:06, 23.39it/s][A[A[A


144it [00:06, 23.33it/s][A[A[A


147it [00:06, 23.46it/s][A[A[A


150it [00:06, 22.36it/s][A[A[A


153it [00:06, 22.62it/s][A[A[A


156it [00:06, 22.80it/s][A[A[A


159it [00:06, 22.91it/s][A[A[A


162it [00:07, 22.92it/s][A[A[A


165it [00:07, 22.89it/s][A[A[A


168it [00:07, 22.85it/s][A[A[A


171it [00:07, 22.68it/s][A[A[A


174it [00:07, 22.61it/s][A[A[A


177it [00:07, 22.69it/s][A[A[A


180it [00:07, 22.83it/s][A[A[A


183it [00:08, 22.93it/s][A[A[A


187it [00:08, 22.87it/s]


Epoch [56/100], Step [100/187], loss: 0.1763





105it [00:04, 22.34it/s][A[A[A


108it [00:04, 22.52it/s][A[A[A


111it [00:04, 22.83it/s][A[A[A


114it [00:05, 23.10it/s][A[A[A


117it [00:05, 23.02it/s][A[A[A


120it [00:05, 23.20it/s][A[A[A


123it [00:05, 22.96it/s][A[A[A


126it [00:05, 22.95it/s][A[A[A


129it [00:05, 23.01it/s][A[A[A


132it [00:05, 22.64it/s][A[A[A


135it [00:05, 22.77it/s][A[A[A


138it [00:06, 22.99it/s][A[A[A


141it [00:06, 23.08it/s][A[A[A


144it [00:06, 23.35it/s][A[A[A


147it [00:06, 23.08it/s][A[A[A


150it [00:06, 23.06it/s][A[A[A


153it [00:06, 23.29it/s][A[A[A


156it [00:06, 23.33it/s][A[A[A


159it [00:06, 23.41it/s][A[A[A


162it [00:07, 23.33it/s][A[A[A


165it [00:07, 23.22it/s][A[A[A


168it [00:07, 23.08it/s][A[A[A


171it [00:07, 22.62it/s][A[A[A


174it [00:07, 22.53it/s][A[A[A


177it [00:07, 22.58it/s][A[A[A


180it [00:07, 23.02it/s][A[A[A


183it [00:08, 23.28it/s][A[A[A


187it [00:08, 22.86it/s]


Epoch [57/100], Step [100/187], loss: 0.0163





105it [00:04, 22.76it/s][A[A[A


108it [00:04, 23.13it/s][A[A[A


111it [00:04, 22.85it/s][A[A[A


114it [00:04, 23.00it/s][A[A[A


117it [00:05, 23.23it/s][A[A[A


120it [00:05, 23.13it/s][A[A[A


123it [00:05, 22.92it/s][A[A[A


126it [00:05, 23.13it/s][A[A[A


129it [00:05, 22.82it/s][A[A[A


132it [00:05, 22.88it/s][A[A[A


135it [00:05, 23.24it/s][A[A[A


138it [00:05, 23.44it/s][A[A[A


141it [00:06, 23.36it/s][A[A[A


144it [00:06, 23.38it/s][A[A[A


147it [00:06, 23.12it/s][A[A[A


150it [00:06, 22.96it/s][A[A[A


153it [00:06, 22.80it/s][A[A[A


156it [00:06, 23.10it/s][A[A[A


159it [00:06, 23.22it/s][A[A[A


162it [00:06, 23.32it/s][A[A[A


165it [00:07, 23.49it/s][A[A[A


168it [00:07, 23.36it/s][A[A[A


171it [00:07, 22.73it/s][A[A[A


174it [00:07, 23.03it/s][A[A[A


177it [00:07, 22.93it/s][A[A[A


180it [00:07, 23.24it/s][A[A[A


183it [00:07, 23.47it/s][A[A[A


187it [00:08, 23.16it/s]


Epoch [58/100], Step [100/187], loss: 0.1075





105it [00:04, 22.39it/s][A[A[A


108it [00:04, 22.82it/s][A[A[A


111it [00:04, 22.39it/s][A[A[A


114it [00:04, 22.70it/s][A[A[A


117it [00:05, 23.00it/s][A[A[A


120it [00:05, 22.97it/s][A[A[A


123it [00:05, 22.09it/s][A[A[A


126it [00:05, 22.28it/s][A[A[A


129it [00:05, 22.46it/s][A[A[A


132it [00:05, 22.76it/s][A[A[A


135it [00:05, 23.04it/s][A[A[A


138it [00:05, 22.61it/s][A[A[A


141it [00:06, 22.74it/s][A[A[A


144it [00:06, 23.09it/s][A[A[A


147it [00:06, 22.40it/s][A[A[A


150it [00:06, 22.69it/s][A[A[A


153it [00:06, 22.97it/s][A[A[A


156it [00:06, 22.95it/s][A[A[A


159it [00:06, 23.27it/s][A[A[A


162it [00:07, 23.42it/s][A[A[A


165it [00:07, 23.31it/s][A[A[A


168it [00:07, 23.51it/s][A[A[A


171it [00:07, 23.20it/s][A[A[A


174it [00:07, 23.36it/s][A[A[A


177it [00:07, 23.58it/s][A[A[A


180it [00:07, 23.41it/s][A[A[A


183it [00:07, 23.40it/s][A[A[A


187it [00:08, 23.12it/s]


Epoch [59/100], Step [100/187], loss: 1.9161





105it [00:04, 22.58it/s][A[A[A


108it [00:04, 22.74it/s][A[A[A


111it [00:04, 23.08it/s][A[A[A


114it [00:04, 23.05it/s][A[A[A


117it [00:05, 22.25it/s][A[A[A


120it [00:05, 22.09it/s][A[A[A


123it [00:05, 22.08it/s][A[A[A


126it [00:05, 22.27it/s][A[A[A


129it [00:05, 22.40it/s][A[A[A


132it [00:05, 22.53it/s][A[A[A


135it [00:05, 22.80it/s][A[A[A


138it [00:05, 23.12it/s][A[A[A


141it [00:06, 23.37it/s][A[A[A


144it [00:06, 23.51it/s][A[A[A


147it [00:06, 23.30it/s][A[A[A


150it [00:06, 23.30it/s][A[A[A


153it [00:06, 22.81it/s][A[A[A


156it [00:06, 23.00it/s][A[A[A


159it [00:06, 23.15it/s][A[A[A


162it [00:06, 23.22it/s][A[A[A


165it [00:07, 22.84it/s][A[A[A


168it [00:07, 22.99it/s][A[A[A


171it [00:07, 22.59it/s][A[A[A


174it [00:07, 22.85it/s][A[A[A


177it [00:07, 23.05it/s][A[A[A


180it [00:07, 23.12it/s][A[A[A


183it [00:07, 23.46it/s][A[A[A


187it [00:08, 23.13it/s]


Epoch [60/100], Step [100/187], loss: 0.7104





105it [00:04, 22.41it/s][A[A[A


108it [00:04, 22.82it/s][A[A[A


111it [00:04, 23.16it/s][A[A[A


114it [00:04, 23.39it/s][A[A[A


117it [00:05, 23.36it/s][A[A[A


120it [00:05, 23.34it/s][A[A[A


123it [00:05, 23.28it/s][A[A[A


126it [00:05, 23.24it/s][A[A[A


129it [00:05, 23.29it/s][A[A[A


132it [00:05, 23.47it/s][A[A[A


135it [00:05, 22.71it/s][A[A[A


138it [00:05, 22.96it/s][A[A[A


141it [00:06, 23.17it/s][A[A[A


144it [00:06, 23.01it/s][A[A[A


147it [00:06, 22.90it/s][A[A[A


150it [00:06, 23.09it/s][A[A[A


153it [00:06, 23.09it/s][A[A[A


156it [00:06, 23.35it/s][A[A[A


159it [00:06, 23.57it/s][A[A[A


162it [00:06, 23.53it/s][A[A[A


165it [00:07, 23.64it/s][A[A[A


168it [00:07, 23.59it/s][A[A[A


171it [00:07, 23.31it/s][A[A[A


174it [00:07, 23.40it/s][A[A[A


177it [00:07, 23.36it/s][A[A[A


180it [00:07, 23.50it/s][A[A[A


183it [00:07, 23.60it/s][A[A[A


187it [00:08, 23.23it/s]


Epoch [61/100], Step [100/187], loss: 0.1004





105it [00:04, 22.89it/s][A[A[A


108it [00:04, 23.18it/s][A[A[A


111it [00:04, 23.43it/s][A[A[A


114it [00:04, 23.07it/s][A[A[A


117it [00:05, 23.13it/s][A[A[A


120it [00:05, 23.21it/s][A[A[A


123it [00:05, 23.00it/s][A[A[A


126it [00:05, 22.83it/s][A[A[A


129it [00:05, 23.14it/s][A[A[A


132it [00:05, 23.12it/s][A[A[A


135it [00:05, 23.35it/s][A[A[A


138it [00:05, 23.47it/s][A[A[A


141it [00:06, 23.14it/s][A[A[A


144it [00:06, 23.30it/s][A[A[A


147it [00:06, 23.47it/s][A[A[A


150it [00:06, 23.23it/s][A[A[A


153it [00:06, 23.33it/s][A[A[A


156it [00:06, 23.49it/s][A[A[A


159it [00:06, 22.87it/s][A[A[A


162it [00:06, 22.95it/s][A[A[A


165it [00:07, 23.11it/s][A[A[A


168it [00:07, 22.95it/s][A[A[A


171it [00:07, 22.93it/s][A[A[A


174it [00:07, 23.01it/s][A[A[A


177it [00:07, 23.16it/s][A[A[A


180it [00:07, 23.31it/s][A[A[A


183it [00:07, 23.40it/s][A[A[A


187it [00:08, 23.22it/s]


Epoch [62/100], Step [100/187], loss: 0.0078





105it [00:04, 22.61it/s][A[A[A


108it [00:04, 22.48it/s][A[A[A


111it [00:04, 22.90it/s][A[A[A


114it [00:04, 23.24it/s][A[A[A


117it [00:05, 23.19it/s][A[A[A


120it [00:05, 23.41it/s][A[A[A


123it [00:05, 23.50it/s][A[A[A


126it [00:05, 23.09it/s][A[A[A


129it [00:05, 23.37it/s][A[A[A


132it [00:05, 23.15it/s][A[A[A


135it [00:05, 22.53it/s][A[A[A


138it [00:05, 22.64it/s][A[A[A


141it [00:06, 22.68it/s][A[A[A


144it [00:06, 22.89it/s][A[A[A


147it [00:06, 23.06it/s][A[A[A


150it [00:06, 22.91it/s][A[A[A


153it [00:06, 23.13it/s][A[A[A


156it [00:06, 23.35it/s][A[A[A


159it [00:06, 23.12it/s][A[A[A


162it [00:06, 23.17it/s][A[A[A


165it [00:07, 23.47it/s][A[A[A


168it [00:07, 23.51it/s][A[A[A


171it [00:07, 23.58it/s][A[A[A


174it [00:07, 23.53it/s][A[A[A


177it [00:07, 23.59it/s][A[A[A


180it [00:07, 23.46it/s][A[A[A


183it [00:07, 23.51it/s][A[A[A


187it [00:08, 23.26it/s]


Epoch [63/100], Step [100/187], loss: 0.0289





105it [00:04, 22.58it/s][A[A[A


108it [00:04, 22.77it/s][A[A[A


111it [00:04, 23.15it/s][A[A[A


114it [00:04, 23.33it/s][A[A[A


117it [00:05, 23.32it/s][A[A[A


120it [00:05, 23.38it/s][A[A[A


123it [00:05, 23.55it/s][A[A[A


126it [00:05, 23.03it/s][A[A[A


129it [00:05, 23.15it/s][A[A[A


132it [00:05, 23.28it/s][A[A[A


135it [00:05, 22.45it/s][A[A[A


138it [00:05, 22.82it/s][A[A[A


141it [00:06, 23.08it/s][A[A[A


144it [00:06, 22.62it/s][A[A[A


147it [00:06, 22.37it/s][A[A[A


150it [00:06, 22.52it/s][A[A[A


153it [00:06, 22.90it/s][A[A[A


156it [00:06, 23.09it/s][A[A[A


159it [00:06, 23.13it/s][A[A[A


162it [00:07, 23.33it/s][A[A[A


165it [00:07, 23.49it/s][A[A[A


168it [00:07, 23.48it/s][A[A[A


171it [00:07, 23.58it/s][A[A[A


174it [00:07, 23.35it/s][A[A[A


177it [00:07, 23.37it/s][A[A[A


180it [00:07, 23.22it/s][A[A[A


183it [00:07, 23.44it/s][A[A[A


187it [00:08, 23.10it/s]


Epoch [64/100], Step [100/187], loss: 0.0212





105it [00:04, 22.64it/s][A[A[A


108it [00:04, 23.04it/s][A[A[A


111it [00:04, 23.02it/s][A[A[A


114it [00:04, 23.17it/s][A[A[A


117it [00:05, 23.31it/s][A[A[A


120it [00:05, 23.31it/s][A[A[A


123it [00:05, 23.55it/s][A[A[A


126it [00:05, 23.13it/s][A[A[A


129it [00:05, 22.92it/s][A[A[A


132it [00:05, 23.13it/s][A[A[A


135it [00:05, 23.19it/s][A[A[A


138it [00:05, 23.33it/s][A[A[A


141it [00:06, 23.60it/s][A[A[A


144it [00:06, 23.53it/s][A[A[A


147it [00:06, 23.74it/s][A[A[A


150it [00:06, 23.60it/s][A[A[A


153it [00:06, 23.56it/s][A[A[A


156it [00:06, 23.62it/s][A[A[A


159it [00:06, 23.64it/s][A[A[A


162it [00:06, 23.56it/s][A[A[A


165it [00:07, 23.64it/s][A[A[A


168it [00:07, 23.63it/s][A[A[A


171it [00:07, 23.13it/s][A[A[A


174it [00:07, 23.11it/s][A[A[A


177it [00:07, 23.43it/s][A[A[A


180it [00:07, 23.32it/s][A[A[A


183it [00:07, 23.50it/s][A[A[A


187it [00:08, 23.27it/s]


Epoch [65/100], Step [100/187], loss: 0.0946





105it [00:04, 22.21it/s][A[A[A


108it [00:04, 22.61it/s][A[A[A


111it [00:04, 22.86it/s][A[A[A


114it [00:05, 22.81it/s][A[A[A


117it [00:05, 22.79it/s][A[A[A


120it [00:05, 22.81it/s][A[A[A


123it [00:05, 22.79it/s][A[A[A


126it [00:05, 22.57it/s][A[A[A


129it [00:05, 22.93it/s][A[A[A


132it [00:05, 22.91it/s][A[A[A


135it [00:05, 23.12it/s][A[A[A


138it [00:06, 23.14it/s][A[A[A


141it [00:06, 22.57it/s][A[A[A


144it [00:06, 22.76it/s][A[A[A


147it [00:06, 22.84it/s][A[A[A


150it [00:06, 22.66it/s][A[A[A


153it [00:06, 22.95it/s][A[A[A


156it [00:06, 22.71it/s][A[A[A


159it [00:06, 22.92it/s][A[A[A


162it [00:07, 22.94it/s][A[A[A


165it [00:07, 22.95it/s][A[A[A


168it [00:07, 23.10it/s][A[A[A


171it [00:07, 22.99it/s][A[A[A


174it [00:07, 22.86it/s][A[A[A


177it [00:07, 22.96it/s][A[A[A


180it [00:07, 22.24it/s][A[A[A


183it [00:08, 22.32it/s][A[A[A


187it [00:08, 22.79it/s]


Epoch [66/100], Step [100/187], loss: 0.0298





105it [00:04, 22.46it/s][A[A[A


108it [00:04, 22.59it/s][A[A[A


111it [00:04, 22.65it/s][A[A[A


114it [00:05, 22.72it/s][A[A[A


117it [00:05, 22.96it/s][A[A[A


120it [00:05, 23.22it/s][A[A[A


123it [00:05, 22.93it/s][A[A[A


126it [00:05, 22.95it/s][A[A[A


129it [00:05, 22.80it/s][A[A[A


132it [00:05, 22.95it/s][A[A[A


135it [00:05, 22.98it/s][A[A[A


138it [00:06, 23.21it/s][A[A[A


141it [00:06, 23.28it/s][A[A[A


144it [00:06, 23.29it/s][A[A[A


147it [00:06, 22.97it/s][A[A[A


150it [00:06, 23.23it/s][A[A[A


153it [00:06, 23.21it/s][A[A[A


156it [00:06, 23.20it/s][A[A[A


159it [00:06, 23.35it/s][A[A[A


162it [00:07, 23.30it/s][A[A[A


165it [00:07, 23.42it/s][A[A[A


168it [00:07, 23.25it/s][A[A[A


171it [00:07, 22.36it/s][A[A[A


174it [00:07, 22.54it/s][A[A[A


177it [00:07, 22.56it/s][A[A[A


180it [00:07, 22.81it/s][A[A[A


183it [00:08, 23.10it/s][A[A[A


187it [00:08, 22.79it/s]


Epoch [67/100], Step [100/187], loss: 0.0493





105it [00:04, 22.61it/s][A[A[A


108it [00:04, 22.77it/s][A[A[A


111it [00:04, 22.98it/s][A[A[A


114it [00:04, 23.26it/s][A[A[A


117it [00:05, 23.53it/s][A[A[A


120it [00:05, 23.19it/s][A[A[A


123it [00:05, 22.98it/s][A[A[A


126it [00:05, 23.23it/s][A[A[A


129it [00:05, 23.19it/s][A[A[A


132it [00:05, 23.40it/s][A[A[A


135it [00:05, 23.62it/s][A[A[A


138it [00:05, 23.73it/s][A[A[A


141it [00:06, 23.20it/s][A[A[A


144it [00:06, 23.35it/s][A[A[A


147it [00:06, 23.04it/s][A[A[A


150it [00:06, 23.01it/s][A[A[A


153it [00:06, 23.37it/s][A[A[A


156it [00:06, 23.26it/s][A[A[A


159it [00:06, 23.47it/s][A[A[A


162it [00:06, 23.68it/s][A[A[A


165it [00:07, 23.74it/s][A[A[A


168it [00:07, 23.32it/s][A[A[A


171it [00:07, 23.33it/s][A[A[A


174it [00:07, 23.35it/s][A[A[A


177it [00:07, 23.31it/s][A[A[A


180it [00:07, 23.52it/s][A[A[A


183it [00:07, 23.62it/s][A[A[A


187it [00:08, 23.20it/s]


Epoch [68/100], Step [100/187], loss: 1.1445





105it [00:04, 22.60it/s][A[A[A


108it [00:04, 22.91it/s][A[A[A


111it [00:04, 23.13it/s][A[A[A


114it [00:04, 23.17it/s][A[A[A


117it [00:05, 23.42it/s][A[A[A


120it [00:05, 23.61it/s][A[A[A


123it [00:05, 23.03it/s][A[A[A


126it [00:05, 23.27it/s][A[A[A


129it [00:05, 22.89it/s][A[A[A


132it [00:05, 22.50it/s][A[A[A


135it [00:05, 22.78it/s][A[A[A


138it [00:05, 23.05it/s][A[A[A


141it [00:06, 23.12it/s][A[A[A


144it [00:06, 23.31it/s][A[A[A


147it [00:06, 23.21it/s][A[A[A


150it [00:06, 23.22it/s][A[A[A


153it [00:06, 23.30it/s][A[A[A


156it [00:06, 23.29it/s][A[A[A


159it [00:06, 23.45it/s][A[A[A


162it [00:06, 23.56it/s][A[A[A


165it [00:07, 23.45it/s][A[A[A


168it [00:07, 23.51it/s][A[A[A


171it [00:07, 22.79it/s][A[A[A


174it [00:07, 22.77it/s][A[A[A


177it [00:07, 22.28it/s][A[A[A


180it [00:07, 22.70it/s][A[A[A


183it [00:07, 22.87it/s][A[A[A


187it [00:08, 23.11it/s]


Epoch [69/100], Step [100/187], loss: 0.8644





105it [00:04, 23.01it/s][A[A[A


108it [00:04, 23.29it/s][A[A[A


111it [00:04, 23.26it/s][A[A[A


114it [00:04, 23.56it/s][A[A[A


117it [00:05, 23.57it/s][A[A[A


120it [00:05, 23.63it/s][A[A[A


123it [00:05, 23.46it/s][A[A[A


126it [00:05, 23.58it/s][A[A[A


129it [00:05, 23.50it/s][A[A[A


132it [00:05, 23.56it/s][A[A[A


135it [00:05, 23.75it/s][A[A[A


138it [00:05, 23.50it/s][A[A[A


141it [00:06, 23.29it/s][A[A[A


144it [00:06, 23.62it/s][A[A[A


147it [00:06, 23.14it/s][A[A[A


150it [00:06, 23.26it/s][A[A[A


153it [00:06, 23.23it/s][A[A[A


156it [00:06, 23.08it/s][A[A[A


159it [00:06, 23.12it/s][A[A[A


162it [00:06, 23.30it/s][A[A[A


165it [00:07, 23.33it/s][A[A[A


168it [00:07, 23.44it/s][A[A[A


171it [00:07, 23.16it/s][A[A[A


174it [00:07, 23.05it/s][A[A[A


177it [00:07, 23.01it/s][A[A[A


180it [00:07, 23.18it/s][A[A[A


183it [00:07, 22.82it/s][A[A[A


187it [00:08, 23.29it/s]


Epoch [70/100], Step [100/187], loss: 0.0896





105it [00:04, 22.14it/s][A[A[A


108it [00:04, 22.50it/s][A[A[A


111it [00:04, 22.75it/s][A[A[A


114it [00:04, 22.95it/s][A[A[A


117it [00:05, 22.86it/s][A[A[A


120it [00:05, 22.78it/s][A[A[A


123it [00:05, 23.01it/s][A[A[A


126it [00:05, 23.05it/s][A[A[A


129it [00:05, 23.31it/s][A[A[A


132it [00:05, 23.55it/s][A[A[A


135it [00:05, 23.31it/s][A[A[A


138it [00:05, 23.39it/s][A[A[A


141it [00:06, 23.63it/s][A[A[A


144it [00:06, 23.50it/s][A[A[A


147it [00:06, 23.40it/s][A[A[A


150it [00:06, 23.48it/s][A[A[A


153it [00:06, 23.48it/s][A[A[A


156it [00:06, 22.66it/s][A[A[A


159it [00:06, 22.90it/s][A[A[A


162it [00:07, 22.69it/s][A[A[A


165it [00:07, 22.82it/s][A[A[A


168it [00:07, 22.99it/s][A[A[A


171it [00:07, 22.89it/s][A[A[A


174it [00:07, 23.19it/s][A[A[A


177it [00:07, 23.39it/s][A[A[A


180it [00:07, 23.24it/s][A[A[A


183it [00:07, 23.29it/s][A[A[A


187it [00:08, 23.06it/s]


Epoch [71/100], Step [100/187], loss: 0.0324





105it [00:04, 22.73it/s][A[A[A


108it [00:04, 23.08it/s][A[A[A


111it [00:04, 23.37it/s][A[A[A


114it [00:04, 23.34it/s][A[A[A


117it [00:05, 23.46it/s][A[A[A


120it [00:05, 23.61it/s][A[A[A


123it [00:05, 23.10it/s][A[A[A


126it [00:05, 23.03it/s][A[A[A


129it [00:05, 23.40it/s][A[A[A


132it [00:05, 23.30it/s][A[A[A


135it [00:05, 23.47it/s][A[A[A


138it [00:05, 23.57it/s][A[A[A


141it [00:06, 23.62it/s][A[A[A


144it [00:06, 23.31it/s][A[A[A


147it [00:06, 23.31it/s][A[A[A


150it [00:06, 23.16it/s][A[A[A


153it [00:06, 23.21it/s][A[A[A


156it [00:06, 23.47it/s][A[A[A


159it [00:06, 23.56it/s][A[A[A


162it [00:06, 23.59it/s][A[A[A


165it [00:07, 23.63it/s][A[A[A


168it [00:07, 23.50it/s][A[A[A


171it [00:07, 23.11it/s][A[A[A


174it [00:07, 23.40it/s][A[A[A


177it [00:07, 23.34it/s][A[A[A


180it [00:07, 23.51it/s][A[A[A


183it [00:07, 23.67it/s][A[A[A


187it [00:08, 23.33it/s]


Epoch [72/100], Step [100/187], loss: 0.3757





105it [00:04, 22.69it/s][A[A[A


108it [00:04, 22.92it/s][A[A[A


111it [00:04, 23.10it/s][A[A[A


114it [00:04, 22.39it/s][A[A[A


117it [00:05, 22.56it/s][A[A[A


120it [00:05, 23.04it/s][A[A[A


123it [00:05, 23.24it/s][A[A[A


126it [00:05, 23.01it/s][A[A[A


129it [00:05, 23.31it/s][A[A[A


132it [00:05, 23.53it/s][A[A[A


135it [00:05, 23.41it/s][A[A[A


138it [00:05, 23.31it/s][A[A[A


141it [00:06, 23.48it/s][A[A[A


144it [00:06, 23.33it/s][A[A[A


147it [00:06, 22.54it/s][A[A[A


150it [00:06, 22.52it/s][A[A[A


153it [00:06, 22.86it/s][A[A[A


156it [00:06, 23.15it/s][A[A[A


159it [00:06, 23.04it/s][A[A[A


162it [00:07, 23.04it/s][A[A[A


165it [00:07, 23.23it/s][A[A[A


168it [00:07, 23.18it/s][A[A[A


171it [00:07, 22.91it/s][A[A[A


174it [00:07, 23.13it/s][A[A[A


177it [00:07, 23.17it/s][A[A[A


180it [00:07, 23.21it/s][A[A[A


183it [00:07, 23.44it/s][A[A[A


187it [00:08, 23.01it/s]


Epoch [73/100], Step [100/187], loss: 0.0171





105it [00:04, 22.40it/s][A[A[A


108it [00:04, 22.53it/s][A[A[A


111it [00:04, 22.78it/s][A[A[A


114it [00:04, 22.57it/s][A[A[A


117it [00:05, 22.66it/s][A[A[A


120it [00:05, 22.74it/s][A[A[A


123it [00:05, 22.61it/s][A[A[A


126it [00:05, 22.80it/s][A[A[A


129it [00:05, 22.90it/s][A[A[A


132it [00:05, 22.92it/s][A[A[A


135it [00:05, 22.77it/s][A[A[A


138it [00:06, 22.91it/s][A[A[A


141it [00:06, 23.06it/s][A[A[A


144it [00:06, 22.96it/s][A[A[A


147it [00:06, 22.90it/s][A[A[A


150it [00:06, 23.10it/s][A[A[A


153it [00:06, 23.17it/s][A[A[A


156it [00:06, 23.03it/s][A[A[A


159it [00:06, 22.58it/s][A[A[A


162it [00:07, 22.77it/s][A[A[A


165it [00:07, 22.64it/s][A[A[A


168it [00:07, 22.71it/s][A[A[A


171it [00:07, 22.62it/s][A[A[A


174it [00:07, 22.51it/s][A[A[A


177it [00:07, 22.71it/s][A[A[A


180it [00:07, 22.37it/s][A[A[A


183it [00:08, 21.73it/s][A[A[A


187it [00:08, 22.76it/s]


Epoch [74/100], Step [100/187], loss: 0.0742





105it [00:04, 22.44it/s][A[A[A


108it [00:04, 22.89it/s][A[A[A


111it [00:04, 23.06it/s][A[A[A


114it [00:04, 23.33it/s][A[A[A


117it [00:05, 23.51it/s][A[A[A


120it [00:05, 23.40it/s][A[A[A


123it [00:05, 23.51it/s][A[A[A


126it [00:05, 23.56it/s][A[A[A


129it [00:05, 23.80it/s][A[A[A


132it [00:05, 23.80it/s][A[A[A


135it [00:05, 23.43it/s][A[A[A


138it [00:05, 23.43it/s][A[A[A


141it [00:06, 23.45it/s][A[A[A


144it [00:06, 23.11it/s][A[A[A


147it [00:06, 23.20it/s][A[A[A


150it [00:06, 23.33it/s][A[A[A


153it [00:06, 22.79it/s][A[A[A


156it [00:06, 23.05it/s][A[A[A


159it [00:06, 23.03it/s][A[A[A


162it [00:07, 23.05it/s][A[A[A


165it [00:07, 23.11it/s][A[A[A


168it [00:07, 22.98it/s][A[A[A


171it [00:07, 23.02it/s][A[A[A


174it [00:07, 23.08it/s][A[A[A


177it [00:07, 23.31it/s][A[A[A


180it [00:07, 23.26it/s][A[A[A


183it [00:07, 23.27it/s][A[A[A


187it [00:08, 23.04it/s]


Epoch [75/100], Step [100/187], loss: 0.0070





105it [00:04, 22.21it/s][A[A[A


108it [00:04, 22.59it/s][A[A[A


111it [00:04, 22.72it/s][A[A[A


114it [00:04, 22.88it/s][A[A[A


117it [00:05, 23.08it/s][A[A[A


120it [00:05, 22.83it/s][A[A[A


123it [00:05, 23.08it/s][A[A[A


126it [00:05, 22.14it/s][A[A[A


129it [00:05, 22.50it/s][A[A[A


132it [00:05, 22.79it/s][A[A[A


135it [00:05, 22.90it/s][A[A[A


138it [00:06, 23.10it/s][A[A[A


141it [00:06, 23.23it/s][A[A[A


144it [00:06, 22.66it/s][A[A[A


147it [00:06, 22.61it/s][A[A[A


150it [00:06, 22.84it/s][A[A[A


153it [00:06, 22.89it/s][A[A[A


156it [00:06, 23.06it/s][A[A[A


159it [00:06, 23.14it/s][A[A[A


162it [00:07, 23.06it/s][A[A[A


165it [00:07, 22.80it/s][A[A[A


168it [00:07, 22.81it/s][A[A[A


171it [00:07, 22.92it/s][A[A[A


174it [00:07, 23.01it/s][A[A[A


177it [00:07, 22.89it/s][A[A[A


180it [00:07, 22.95it/s][A[A[A


183it [00:07, 23.00it/s][A[A[A


187it [00:08, 22.92it/s]


Epoch [76/100], Step [100/187], loss: 0.0069





105it [00:04, 22.82it/s][A[A[A


108it [00:04, 23.12it/s][A[A[A


111it [00:04, 22.75it/s][A[A[A


114it [00:04, 22.77it/s][A[A[A


117it [00:05, 23.01it/s][A[A[A


120it [00:05, 22.99it/s][A[A[A


123it [00:05, 22.84it/s][A[A[A


126it [00:05, 22.98it/s][A[A[A


129it [00:05, 23.33it/s][A[A[A


132it [00:05, 22.62it/s][A[A[A


135it [00:05, 22.94it/s][A[A[A


138it [00:06, 22.95it/s][A[A[A


141it [00:06, 23.07it/s][A[A[A


144it [00:06, 23.02it/s][A[A[A


147it [00:06, 23.31it/s][A[A[A


150it [00:06, 23.26it/s][A[A[A


153it [00:06, 23.44it/s][A[A[A


156it [00:06, 23.34it/s][A[A[A


159it [00:06, 23.10it/s][A[A[A


162it [00:07, 23.11it/s][A[A[A


165it [00:07, 22.83it/s][A[A[A


168it [00:07, 22.90it/s][A[A[A


171it [00:07, 23.07it/s][A[A[A


174it [00:07, 23.30it/s][A[A[A


177it [00:07, 23.38it/s][A[A[A


180it [00:07, 22.84it/s][A[A[A


183it [00:07, 23.11it/s][A[A[A


187it [00:08, 23.00it/s]


Epoch [77/100], Step [100/187], loss: 0.1310





105it [00:04, 22.65it/s][A[A[A


108it [00:04, 23.02it/s][A[A[A


111it [00:04, 23.25it/s][A[A[A


114it [00:04, 23.27it/s][A[A[A


117it [00:05, 23.48it/s][A[A[A


120it [00:05, 23.33it/s][A[A[A


123it [00:05, 23.24it/s][A[A[A


126it [00:05, 23.39it/s][A[A[A


129it [00:05, 23.46it/s][A[A[A


132it [00:05, 22.86it/s][A[A[A


135it [00:05, 22.99it/s][A[A[A


138it [00:05, 22.90it/s][A[A[A


141it [00:06, 23.21it/s][A[A[A


144it [00:06, 23.07it/s][A[A[A


147it [00:06, 23.11it/s][A[A[A


150it [00:06, 23.19it/s][A[A[A


153it [00:06, 23.24it/s][A[A[A


156it [00:06, 23.07it/s][A[A[A


159it [00:06, 23.19it/s][A[A[A


162it [00:07, 23.29it/s][A[A[A


165it [00:07, 22.88it/s][A[A[A


168it [00:07, 22.06it/s][A[A[A


171it [00:07, 22.39it/s][A[A[A


174it [00:07, 22.40it/s][A[A[A


177it [00:07, 22.76it/s][A[A[A


180it [00:07, 22.63it/s][A[A[A


183it [00:07, 22.61it/s][A[A[A


187it [00:08, 23.02it/s]


Epoch [78/100], Step [100/187], loss: 0.0887





105it [00:04, 23.07it/s][A[A[A


108it [00:04, 22.57it/s][A[A[A


111it [00:04, 23.01it/s][A[A[A


114it [00:04, 23.39it/s][A[A[A


117it [00:05, 23.17it/s][A[A[A


120it [00:05, 23.24it/s][A[A[A


123it [00:05, 23.51it/s][A[A[A


126it [00:05, 23.51it/s][A[A[A


129it [00:05, 23.58it/s][A[A[A


132it [00:05, 23.71it/s][A[A[A


135it [00:05, 23.71it/s][A[A[A


138it [00:05, 23.81it/s][A[A[A


141it [00:06, 23.51it/s][A[A[A


144it [00:06, 23.53it/s][A[A[A


147it [00:06, 23.60it/s][A[A[A


150it [00:06, 23.33it/s][A[A[A


153it [00:06, 23.42it/s][A[A[A


156it [00:06, 23.51it/s][A[A[A


159it [00:06, 23.05it/s][A[A[A


162it [00:07, 23.23it/s][A[A[A


165it [00:07, 23.21it/s][A[A[A


168it [00:07, 23.26it/s][A[A[A


171it [00:07, 23.24it/s][A[A[A


174it [00:07, 23.15it/s][A[A[A


177it [00:07, 23.23it/s][A[A[A


180it [00:07, 23.34it/s][A[A[A


183it [00:07, 23.39it/s][A[A[A


187it [00:08, 23.11it/s]


Epoch [79/100], Step [100/187], loss: 0.0876





105it [00:04, 22.77it/s][A[A[A


108it [00:04, 22.89it/s][A[A[A


111it [00:04, 23.12it/s][A[A[A


114it [00:04, 23.07it/s][A[A[A


117it [00:05, 23.35it/s][A[A[A


120it [00:05, 23.24it/s][A[A[A


123it [00:05, 23.22it/s][A[A[A


126it [00:05, 23.03it/s][A[A[A


129it [00:05, 23.16it/s][A[A[A


132it [00:05, 23.24it/s][A[A[A


135it [00:05, 23.46it/s][A[A[A


138it [00:05, 23.59it/s][A[A[A


141it [00:06, 23.08it/s][A[A[A


144it [00:06, 22.86it/s][A[A[A


147it [00:06, 23.07it/s][A[A[A


150it [00:06, 22.90it/s][A[A[A


153it [00:06, 23.18it/s][A[A[A


156it [00:06, 23.32it/s][A[A[A


159it [00:06, 23.42it/s][A[A[A


162it [00:06, 23.45it/s][A[A[A


165it [00:07, 23.61it/s][A[A[A


168it [00:07, 23.45it/s][A[A[A


171it [00:07, 23.43it/s][A[A[A


174it [00:07, 23.51it/s][A[A[A


177it [00:07, 23.66it/s][A[A[A


180it [00:07, 23.01it/s][A[A[A


183it [00:07, 23.17it/s][A[A[A


187it [00:08, 23.27it/s]


Epoch [80/100], Step [100/187], loss: 0.0027





105it [00:04, 22.53it/s][A[A[A


108it [00:04, 22.80it/s][A[A[A


111it [00:04, 22.79it/s][A[A[A


114it [00:04, 23.10it/s][A[A[A


117it [00:05, 23.12it/s][A[A[A


120it [00:05, 22.67it/s][A[A[A


123it [00:05, 22.92it/s][A[A[A


126it [00:05, 23.18it/s][A[A[A


129it [00:05, 23.26it/s][A[A[A


132it [00:05, 23.17it/s][A[A[A


135it [00:05, 23.06it/s][A[A[A


138it [00:05, 23.05it/s][A[A[A


141it [00:06, 23.27it/s][A[A[A


144it [00:06, 23.25it/s][A[A[A


147it [00:06, 23.20it/s][A[A[A


150it [00:06, 23.34it/s][A[A[A


153it [00:06, 23.63it/s][A[A[A


156it [00:06, 23.49it/s][A[A[A


159it [00:06, 23.64it/s][A[A[A


162it [00:07, 23.66it/s][A[A[A


165it [00:07, 23.68it/s][A[A[A


168it [00:07, 23.32it/s][A[A[A


171it [00:07, 22.95it/s][A[A[A


174it [00:07, 23.14it/s][A[A[A


177it [00:07, 23.43it/s][A[A[A


180it [00:07, 23.56it/s][A[A[A


183it [00:07, 23.68it/s][A[A[A


187it [00:08, 23.14it/s]


Epoch [81/100], Step [100/187], loss: 0.0097





105it [00:04, 23.08it/s][A[A[A


108it [00:04, 23.34it/s][A[A[A


111it [00:04, 23.44it/s][A[A[A


114it [00:04, 23.60it/s][A[A[A


117it [00:05, 23.63it/s][A[A[A


120it [00:05, 23.40it/s][A[A[A


123it [00:05, 22.58it/s][A[A[A


126it [00:05, 22.79it/s][A[A[A


129it [00:05, 22.92it/s][A[A[A


132it [00:05, 22.67it/s][A[A[A


135it [00:05, 22.78it/s][A[A[A


138it [00:05, 22.94it/s][A[A[A


141it [00:06, 22.97it/s][A[A[A


144it [00:06, 22.35it/s][A[A[A


147it [00:06, 22.34it/s][A[A[A


150it [00:06, 22.57it/s][A[A[A


153it [00:06, 22.89it/s][A[A[A


156it [00:06, 22.80it/s][A[A[A


159it [00:06, 22.74it/s][A[A[A


162it [00:07, 21.72it/s][A[A[A


165it [00:07, 21.77it/s][A[A[A


168it [00:07, 22.27it/s][A[A[A


171it [00:07, 22.49it/s][A[A[A


174it [00:07, 22.73it/s][A[A[A


177it [00:07, 23.03it/s][A[A[A


180it [00:07, 23.28it/s][A[A[A


183it [00:07, 23.19it/s][A[A[A


187it [00:08, 22.96it/s]


Epoch [82/100], Step [100/187], loss: 0.0061





105it [00:04, 22.52it/s][A[A[A


108it [00:04, 22.91it/s][A[A[A


111it [00:04, 23.04it/s][A[A[A


114it [00:04, 22.99it/s][A[A[A


117it [00:05, 23.09it/s][A[A[A


120it [00:05, 22.86it/s][A[A[A


123it [00:05, 22.91it/s][A[A[A


126it [00:05, 23.07it/s][A[A[A


129it [00:05, 23.16it/s][A[A[A


132it [00:05, 23.04it/s][A[A[A


135it [00:05, 23.13it/s][A[A[A


138it [00:05, 23.34it/s][A[A[A


141it [00:06, 22.46it/s][A[A[A


144it [00:06, 22.88it/s][A[A[A


147it [00:06, 23.25it/s][A[A[A


150it [00:06, 23.38it/s][A[A[A


153it [00:06, 23.48it/s][A[A[A


156it [00:06, 23.54it/s][A[A[A


159it [00:06, 23.59it/s][A[A[A


162it [00:07, 23.44it/s][A[A[A


165it [00:07, 22.87it/s][A[A[A


168it [00:07, 22.07it/s][A[A[A


171it [00:07, 21.87it/s][A[A[A


174it [00:07, 22.06it/s][A[A[A


177it [00:07, 22.25it/s][A[A[A


180it [00:07, 22.59it/s][A[A[A


183it [00:07, 22.94it/s][A[A[A


187it [00:08, 22.99it/s]


Epoch [83/100], Step [100/187], loss: 0.3663





105it [00:04, 22.68it/s][A[A[A


108it [00:04, 22.99it/s][A[A[A


111it [00:04, 23.11it/s][A[A[A


114it [00:04, 23.03it/s][A[A[A


117it [00:05, 21.64it/s][A[A[A


120it [00:05, 21.40it/s][A[A[A


123it [00:05, 21.23it/s][A[A[A


126it [00:05, 21.81it/s][A[A[A


129it [00:05, 22.17it/s][A[A[A


132it [00:05, 22.26it/s][A[A[A


135it [00:05, 21.81it/s][A[A[A


138it [00:06, 21.94it/s][A[A[A


141it [00:06, 21.61it/s][A[A[A


144it [00:06, 21.96it/s][A[A[A


147it [00:06, 22.21it/s][A[A[A


150it [00:06, 22.27it/s][A[A[A


153it [00:06, 22.38it/s][A[A[A


156it [00:06, 22.62it/s][A[A[A


159it [00:06, 22.69it/s][A[A[A


162it [00:07, 22.56it/s][A[A[A


165it [00:07, 22.73it/s][A[A[A


168it [00:07, 22.68it/s][A[A[A


171it [00:07, 22.88it/s][A[A[A


174it [00:07, 22.89it/s][A[A[A


177it [00:07, 22.47it/s][A[A[A


180it [00:07, 22.78it/s][A[A[A


183it [00:08, 22.91it/s][A[A[A


187it [00:08, 22.83it/s]


Epoch [84/100], Step [100/187], loss: 0.2890





105it [00:04, 22.40it/s][A[A[A


108it [00:04, 22.58it/s][A[A[A


111it [00:04, 22.55it/s][A[A[A


114it [00:05, 22.51it/s][A[A[A


117it [00:05, 22.26it/s][A[A[A


120it [00:05, 22.29it/s][A[A[A


123it [00:05, 22.55it/s][A[A[A


126it [00:05, 22.20it/s][A[A[A


129it [00:05, 22.39it/s][A[A[A


132it [00:05, 22.64it/s][A[A[A


135it [00:06, 22.41it/s][A[A[A


138it [00:06, 22.47it/s][A[A[A


141it [00:06, 22.79it/s][A[A[A


144it [00:06, 22.77it/s][A[A[A


147it [00:06, 22.84it/s][A[A[A


150it [00:06, 22.62it/s][A[A[A


153it [00:06, 22.80it/s][A[A[A


156it [00:06, 21.90it/s][A[A[A


159it [00:07, 22.07it/s][A[A[A


162it [00:07, 22.53it/s][A[A[A


165it [00:07, 22.45it/s][A[A[A


168it [00:07, 21.78it/s][A[A[A


171it [00:07, 22.37it/s][A[A[A


174it [00:07, 22.60it/s][A[A[A


177it [00:07, 22.88it/s][A[A[A


180it [00:08, 22.75it/s][A[A[A


183it [00:08, 22.80it/s][A[A[A


187it [00:08, 22.49it/s]


Epoch [85/100], Step [100/187], loss: 0.0172





105it [00:04, 21.68it/s][A[A[A


108it [00:04, 22.08it/s][A[A[A


111it [00:04, 22.11it/s][A[A[A


114it [00:04, 22.50it/s][A[A[A


117it [00:05, 22.84it/s][A[A[A


120it [00:05, 22.96it/s][A[A[A


123it [00:05, 23.11it/s][A[A[A


126it [00:05, 23.19it/s][A[A[A


129it [00:05, 22.95it/s][A[A[A


132it [00:05, 22.82it/s][A[A[A


135it [00:05, 22.98it/s][A[A[A


138it [00:06, 23.05it/s][A[A[A


141it [00:06, 23.19it/s][A[A[A


144it [00:06, 23.33it/s][A[A[A


147it [00:06, 22.88it/s][A[A[A


150it [00:06, 23.08it/s][A[A[A


153it [00:06, 23.07it/s][A[A[A


156it [00:06, 23.03it/s][A[A[A


159it [00:06, 23.32it/s][A[A[A


162it [00:07, 23.17it/s][A[A[A


165it [00:07, 23.21it/s][A[A[A


168it [00:07, 23.23it/s][A[A[A


171it [00:07, 23.16it/s][A[A[A


174it [00:07, 23.14it/s][A[A[A


177it [00:07, 23.25it/s][A[A[A


180it [00:07, 22.59it/s][A[A[A


183it [00:07, 22.38it/s][A[A[A


187it [00:08, 22.95it/s]


Epoch [86/100], Step [100/187], loss: 0.8499





105it [00:04, 22.71it/s][A[A[A


108it [00:04, 22.91it/s][A[A[A


111it [00:04, 22.95it/s][A[A[A


114it [00:04, 23.28it/s][A[A[A


117it [00:05, 23.31it/s][A[A[A


120it [00:05, 23.43it/s][A[A[A


123it [00:05, 23.52it/s][A[A[A


126it [00:05, 23.50it/s][A[A[A


129it [00:05, 23.58it/s][A[A[A


132it [00:05, 23.60it/s][A[A[A


135it [00:05, 23.46it/s][A[A[A


138it [00:05, 23.68it/s][A[A[A


141it [00:06, 23.64it/s][A[A[A


144it [00:06, 23.13it/s][A[A[A


147it [00:06, 23.31it/s][A[A[A


150it [00:06, 23.49it/s][A[A[A


153it [00:06, 23.44it/s][A[A[A


156it [00:06, 22.58it/s][A[A[A


159it [00:06, 22.84it/s][A[A[A


162it [00:07, 23.05it/s][A[A[A


165it [00:07, 23.27it/s][A[A[A


168it [00:07, 23.52it/s][A[A[A


171it [00:07, 23.50it/s][A[A[A


174it [00:07, 23.49it/s][A[A[A


177it [00:07, 23.54it/s][A[A[A


180it [00:07, 22.92it/s][A[A[A


183it [00:07, 23.17it/s][A[A[A


187it [00:08, 23.13it/s]


Epoch [87/100], Step [100/187], loss: 0.0305





105it [00:04, 22.98it/s][A[A[A


108it [00:04, 23.10it/s][A[A[A


111it [00:04, 23.05it/s][A[A[A


114it [00:04, 23.26it/s][A[A[A


117it [00:05, 22.94it/s][A[A[A


120it [00:05, 23.08it/s][A[A[A


123it [00:05, 23.29it/s][A[A[A


126it [00:05, 23.25it/s][A[A[A


129it [00:05, 23.43it/s][A[A[A


132it [00:05, 23.17it/s][A[A[A


135it [00:05, 23.20it/s][A[A[A


138it [00:05, 22.98it/s][A[A[A


141it [00:06, 23.11it/s][A[A[A


144it [00:06, 23.23it/s][A[A[A


147it [00:06, 23.37it/s][A[A[A


150it [00:06, 23.17it/s][A[A[A


153it [00:06, 23.13it/s][A[A[A


156it [00:06, 22.57it/s][A[A[A


159it [00:06, 22.52it/s][A[A[A


162it [00:07, 22.82it/s][A[A[A


165it [00:07, 22.94it/s][A[A[A


168it [00:07, 23.33it/s][A[A[A


171it [00:07, 23.46it/s][A[A[A


174it [00:07, 23.48it/s][A[A[A


177it [00:07, 23.55it/s][A[A[A


180it [00:07, 23.32it/s][A[A[A


183it [00:07, 23.27it/s][A[A[A


187it [00:08, 23.13it/s]


Epoch [88/100], Step [100/187], loss: 0.0497





105it [00:04, 22.86it/s][A[A[A


108it [00:04, 23.11it/s][A[A[A


111it [00:04, 23.00it/s][A[A[A


114it [00:04, 23.20it/s][A[A[A


117it [00:05, 23.28it/s][A[A[A


120it [00:05, 23.20it/s][A[A[A


123it [00:05, 23.34it/s][A[A[A


126it [00:05, 23.32it/s][A[A[A


129it [00:05, 23.16it/s][A[A[A


132it [00:05, 23.44it/s][A[A[A


135it [00:05, 23.18it/s][A[A[A


138it [00:05, 23.17it/s][A[A[A


141it [00:06, 23.31it/s][A[A[A


144it [00:06, 22.93it/s][A[A[A


147it [00:06, 23.11it/s][A[A[A


150it [00:06, 23.26it/s][A[A[A


153it [00:06, 23.24it/s][A[A[A


156it [00:06, 23.12it/s][A[A[A


159it [00:06, 23.23it/s][A[A[A


162it [00:06, 23.08it/s][A[A[A


165it [00:07, 23.15it/s][A[A[A


168it [00:07, 23.31it/s][A[A[A


171it [00:07, 23.22it/s][A[A[A


174it [00:07, 23.20it/s][A[A[A


177it [00:07, 23.15it/s][A[A[A


180it [00:07, 22.87it/s][A[A[A


183it [00:07, 23.08it/s][A[A[A


187it [00:08, 23.19it/s]


Epoch [89/100], Step [100/187], loss: 0.1911





105it [00:04, 23.04it/s][A[A[A


108it [00:04, 23.09it/s][A[A[A


111it [00:04, 22.87it/s][A[A[A


114it [00:04, 23.14it/s][A[A[A


117it [00:05, 22.88it/s][A[A[A


120it [00:05, 23.09it/s][A[A[A


123it [00:05, 23.26it/s][A[A[A


126it [00:05, 23.21it/s][A[A[A


129it [00:05, 23.28it/s][A[A[A


132it [00:05, 23.21it/s][A[A[A


135it [00:05, 23.06it/s][A[A[A


138it [00:05, 22.96it/s][A[A[A


141it [00:06, 23.24it/s][A[A[A


144it [00:06, 22.64it/s][A[A[A


147it [00:06, 22.99it/s][A[A[A


150it [00:06, 23.00it/s][A[A[A


153it [00:06, 22.62it/s][A[A[A


156it [00:06, 22.48it/s][A[A[A


159it [00:06, 22.62it/s][A[A[A


162it [00:07, 22.70it/s][A[A[A


165it [00:07, 23.06it/s][A[A[A


168it [00:07, 23.12it/s][A[A[A


171it [00:07, 23.25it/s][A[A[A


174it [00:07, 23.34it/s][A[A[A


177it [00:07, 23.31it/s][A[A[A


180it [00:07, 23.11it/s][A[A[A


183it [00:07, 22.63it/s][A[A[A


187it [00:08, 22.99it/s]


Epoch [90/100], Step [100/187], loss: 0.0047





105it [00:04, 23.13it/s][A[A[A


108it [00:04, 23.21it/s][A[A[A


111it [00:04, 22.82it/s][A[A[A


114it [00:04, 22.98it/s][A[A[A


117it [00:05, 23.20it/s][A[A[A


120it [00:05, 23.13it/s][A[A[A


123it [00:05, 23.31it/s][A[A[A


126it [00:05, 23.46it/s][A[A[A


129it [00:05, 23.49it/s][A[A[A


132it [00:05, 22.81it/s][A[A[A


135it [00:05, 22.29it/s][A[A[A


138it [00:05, 22.32it/s][A[A[A


141it [00:06, 22.70it/s][A[A[A


144it [00:06, 23.05it/s][A[A[A


147it [00:06, 23.02it/s][A[A[A


150it [00:06, 23.29it/s][A[A[A


153it [00:06, 23.48it/s][A[A[A


156it [00:06, 23.26it/s][A[A[A


159it [00:06, 23.38it/s][A[A[A


162it [00:06, 23.33it/s][A[A[A


165it [00:07, 23.41it/s][A[A[A


168it [00:07, 22.87it/s][A[A[A


171it [00:07, 22.90it/s][A[A[A


174it [00:07, 22.89it/s][A[A[A


177it [00:07, 23.20it/s][A[A[A


180it [00:07, 22.89it/s][A[A[A


183it [00:07, 23.19it/s][A[A[A


187it [00:08, 23.23it/s]


Epoch [91/100], Step [100/187], loss: 0.0246





105it [00:04, 22.11it/s][A[A[A


108it [00:04, 22.22it/s][A[A[A


111it [00:04, 22.26it/s][A[A[A


114it [00:04, 22.54it/s][A[A[A


117it [00:05, 22.89it/s][A[A[A


120it [00:05, 23.21it/s][A[A[A


123it [00:05, 22.61it/s][A[A[A


126it [00:05, 22.55it/s][A[A[A


129it [00:05, 22.78it/s][A[A[A


132it [00:05, 22.73it/s][A[A[A


135it [00:05, 22.76it/s][A[A[A


138it [00:05, 22.98it/s][A[A[A


141it [00:06, 23.02it/s][A[A[A


144it [00:06, 23.21it/s][A[A[A


147it [00:06, 23.43it/s][A[A[A


150it [00:06, 23.38it/s][A[A[A


153it [00:06, 23.46it/s][A[A[A


156it [00:06, 23.38it/s][A[A[A


159it [00:06, 23.43it/s][A[A[A


162it [00:07, 23.29it/s][A[A[A


165it [00:07, 23.17it/s][A[A[A


168it [00:07, 23.36it/s][A[A[A


171it [00:07, 23.18it/s][A[A[A


174it [00:07, 23.25it/s][A[A[A


177it [00:07, 23.55it/s][A[A[A


180it [00:07, 23.27it/s][A[A[A


183it [00:07, 23.49it/s][A[A[A


187it [00:08, 23.13it/s]


Epoch [92/100], Step [100/187], loss: 0.0015





105it [00:04, 22.33it/s][A[A[A


108it [00:04, 22.76it/s][A[A[A


111it [00:04, 22.91it/s][A[A[A


114it [00:04, 23.30it/s][A[A[A


117it [00:05, 23.45it/s][A[A[A


120it [00:05, 23.40it/s][A[A[A


123it [00:05, 23.51it/s][A[A[A


126it [00:05, 23.68it/s][A[A[A


129it [00:05, 23.58it/s][A[A[A


132it [00:05, 23.67it/s][A[A[A


135it [00:05, 23.60it/s][A[A[A


138it [00:05, 23.52it/s][A[A[A


141it [00:06, 23.46it/s][A[A[A


144it [00:06, 23.57it/s][A[A[A


147it [00:06, 23.60it/s][A[A[A


150it [00:06, 22.78it/s][A[A[A


153it [00:06, 23.05it/s][A[A[A


156it [00:06, 23.09it/s][A[A[A


159it [00:06, 22.87it/s][A[A[A


162it [00:06, 22.80it/s][A[A[A


165it [00:07, 23.08it/s][A[A[A


168it [00:07, 23.40it/s][A[A[A


171it [00:07, 23.20it/s][A[A[A


174it [00:07, 23.35it/s][A[A[A


177it [00:07, 23.54it/s][A[A[A


180it [00:07, 23.28it/s][A[A[A


183it [00:07, 23.20it/s][A[A[A


187it [00:08, 23.21it/s]


Epoch [93/100], Step [100/187], loss: 0.0272





105it [00:04, 22.94it/s][A[A[A


108it [00:04, 23.06it/s][A[A[A


111it [00:04, 23.05it/s][A[A[A


114it [00:04, 23.30it/s][A[A[A


117it [00:05, 23.11it/s][A[A[A


120it [00:05, 23.05it/s][A[A[A


123it [00:05, 23.28it/s][A[A[A


126it [00:05, 23.41it/s][A[A[A


129it [00:05, 23.22it/s][A[A[A


132it [00:05, 23.12it/s][A[A[A


135it [00:05, 23.02it/s][A[A[A


138it [00:05, 22.86it/s][A[A[A


141it [00:06, 23.22it/s][A[A[A


144it [00:06, 23.39it/s][A[A[A


147it [00:06, 22.98it/s][A[A[A


150it [00:06, 22.82it/s][A[A[A


153it [00:06, 22.97it/s][A[A[A


156it [00:06, 23.07it/s][A[A[A


159it [00:06, 23.02it/s][A[A[A


162it [00:07, 22.93it/s][A[A[A


165it [00:07, 22.84it/s][A[A[A


168it [00:07, 23.16it/s][A[A[A


171it [00:07, 23.29it/s][A[A[A


174it [00:07, 23.25it/s][A[A[A


177it [00:07, 23.31it/s][A[A[A


180it [00:07, 23.27it/s][A[A[A


183it [00:07, 22.99it/s][A[A[A


187it [00:08, 23.11it/s]


Epoch [94/100], Step [100/187], loss: 0.0716





105it [00:04, 22.54it/s][A[A[A


108it [00:04, 22.27it/s][A[A[A


111it [00:04, 22.01it/s][A[A[A


114it [00:04, 22.12it/s][A[A[A


117it [00:05, 22.28it/s][A[A[A


120it [00:05, 22.30it/s][A[A[A


123it [00:05, 22.73it/s][A[A[A


126it [00:05, 22.97it/s][A[A[A


129it [00:05, 22.98it/s][A[A[A


132it [00:05, 23.24it/s][A[A[A


135it [00:05, 23.10it/s][A[A[A


138it [00:06, 23.40it/s][A[A[A


141it [00:06, 23.45it/s][A[A[A


144it [00:06, 23.64it/s][A[A[A


147it [00:06, 23.74it/s][A[A[A


150it [00:06, 23.31it/s][A[A[A


153it [00:06, 23.50it/s][A[A[A


156it [00:06, 23.56it/s][A[A[A


159it [00:06, 22.71it/s][A[A[A


162it [00:07, 22.99it/s][A[A[A


165it [00:07, 23.26it/s][A[A[A


168it [00:07, 23.39it/s][A[A[A


171it [00:07, 23.16it/s][A[A[A


174it [00:07, 23.28it/s][A[A[A


177it [00:07, 23.48it/s][A[A[A


180it [00:07, 23.56it/s][A[A[A


183it [00:07, 23.42it/s][A[A[A


187it [00:08, 23.03it/s]


Epoch [95/100], Step [100/187], loss: 0.1696





105it [00:04, 22.51it/s][A[A[A


108it [00:04, 22.70it/s][A[A[A


111it [00:04, 22.73it/s][A[A[A


114it [00:04, 22.95it/s][A[A[A


117it [00:05, 23.12it/s][A[A[A


120it [00:05, 23.31it/s][A[A[A


123it [00:05, 23.29it/s][A[A[A


126it [00:05, 23.42it/s][A[A[A


129it [00:05, 23.39it/s][A[A[A


132it [00:05, 22.63it/s][A[A[A


135it [00:05, 22.97it/s][A[A[A


138it [00:06, 23.20it/s][A[A[A


141it [00:06, 23.15it/s][A[A[A


144it [00:06, 23.28it/s][A[A[A


147it [00:06, 23.42it/s][A[A[A


150it [00:06, 23.24it/s][A[A[A


153it [00:06, 23.27it/s][A[A[A


156it [00:06, 22.92it/s][A[A[A


159it [00:06, 23.01it/s][A[A[A


162it [00:07, 22.43it/s][A[A[A


165it [00:07, 22.30it/s][A[A[A


168it [00:07, 22.20it/s][A[A[A


171it [00:07, 22.40it/s][A[A[A


174it [00:07, 22.57it/s][A[A[A


177it [00:07, 22.84it/s][A[A[A


180it [00:07, 22.68it/s][A[A[A


183it [00:08, 22.79it/s][A[A[A


187it [00:08, 22.87it/s]


Epoch [96/100], Step [100/187], loss: 0.0495





105it [00:04, 23.08it/s][A[A[A


108it [00:04, 22.76it/s][A[A[A


111it [00:04, 22.89it/s][A[A[A


114it [00:04, 23.01it/s][A[A[A


117it [00:05, 23.16it/s][A[A[A


120it [00:05, 22.29it/s][A[A[A


123it [00:05, 22.53it/s][A[A[A


126it [00:05, 22.80it/s][A[A[A


129it [00:05, 23.16it/s][A[A[A


132it [00:05, 22.62it/s][A[A[A


135it [00:05, 22.87it/s][A[A[A


138it [00:06, 23.08it/s][A[A[A


141it [00:06, 23.12it/s][A[A[A


144it [00:06, 23.22it/s][A[A[A


147it [00:06, 23.05it/s][A[A[A


150it [00:06, 23.17it/s][A[A[A


153it [00:06, 23.22it/s][A[A[A


156it [00:06, 22.87it/s][A[A[A


159it [00:06, 23.03it/s][A[A[A


162it [00:07, 23.13it/s][A[A[A


165it [00:07, 23.07it/s][A[A[A


168it [00:07, 23.33it/s][A[A[A


171it [00:07, 23.42it/s][A[A[A


174it [00:07, 23.28it/s][A[A[A


177it [00:07, 23.33it/s][A[A[A


180it [00:07, 23.14it/s][A[A[A


183it [00:07, 22.84it/s][A[A[A


187it [00:08, 23.00it/s]


Epoch [97/100], Step [100/187], loss: 0.1982





105it [00:04, 22.45it/s][A[A[A


108it [00:04, 21.97it/s][A[A[A


111it [00:04, 22.32it/s][A[A[A


114it [00:04, 22.83it/s][A[A[A


117it [00:05, 23.12it/s][A[A[A


120it [00:05, 23.27it/s][A[A[A


123it [00:05, 23.42it/s][A[A[A


126it [00:05, 23.57it/s][A[A[A


129it [00:05, 23.47it/s][A[A[A


132it [00:05, 23.03it/s][A[A[A


135it [00:05, 23.27it/s][A[A[A


138it [00:05, 23.18it/s][A[A[A


141it [00:06, 22.83it/s][A[A[A


144it [00:06, 23.12it/s][A[A[A


147it [00:06, 23.35it/s][A[A[A


150it [00:06, 23.21it/s][A[A[A


153it [00:06, 23.36it/s][A[A[A


156it [00:06, 23.12it/s][A[A[A


159it [00:06, 23.05it/s][A[A[A


162it [00:06, 23.32it/s][A[A[A


165it [00:07, 23.44it/s][A[A[A


168it [00:07, 23.31it/s][A[A[A


171it [00:07, 23.32it/s][A[A[A


174it [00:07, 23.25it/s][A[A[A


177it [00:07, 23.13it/s][A[A[A


180it [00:07, 23.07it/s][A[A[A


183it [00:07, 23.22it/s][A[A[A


187it [00:08, 23.10it/s]


Epoch [98/100], Step [100/187], loss: 0.0413





105it [00:04, 22.92it/s][A[A[A


108it [00:04, 22.37it/s][A[A[A


111it [00:04, 22.60it/s][A[A[A


114it [00:04, 22.63it/s][A[A[A


117it [00:05, 22.94it/s][A[A[A


120it [00:05, 23.26it/s][A[A[A


123it [00:05, 23.56it/s][A[A[A


126it [00:05, 23.59it/s][A[A[A


129it [00:05, 23.68it/s][A[A[A


132it [00:05, 23.58it/s][A[A[A


135it [00:05, 23.50it/s][A[A[A


138it [00:05, 23.59it/s][A[A[A


141it [00:06, 23.67it/s][A[A[A


144it [00:06, 23.56it/s][A[A[A


147it [00:06, 23.65it/s][A[A[A


150it [00:06, 23.48it/s][A[A[A


153it [00:06, 23.53it/s][A[A[A


156it [00:06, 23.31it/s][A[A[A


159it [00:06, 23.12it/s][A[A[A


162it [00:06, 23.34it/s][A[A[A


165it [00:07, 23.54it/s][A[A[A


168it [00:07, 23.42it/s][A[A[A


171it [00:07, 23.54it/s][A[A[A


174it [00:07, 23.68it/s][A[A[A


177it [00:07, 22.98it/s][A[A[A


180it [00:07, 22.92it/s][A[A[A


183it [00:07, 23.05it/s][A[A[A


187it [00:08, 23.15it/s]


Epoch [99/100], Step [100/187], loss: 0.0066





105it [00:04, 22.85it/s][A[A[A


108it [00:04, 23.03it/s][A[A[A


111it [00:04, 22.75it/s][A[A[A


114it [00:04, 22.85it/s][A[A[A


117it [00:05, 23.02it/s][A[A[A


120it [00:05, 23.05it/s][A[A[A


123it [00:05, 23.21it/s][A[A[A


126it [00:05, 23.31it/s][A[A[A


129it [00:05, 23.34it/s][A[A[A


132it [00:05, 22.71it/s][A[A[A


135it [00:05, 22.72it/s][A[A[A


138it [00:05, 22.20it/s][A[A[A


141it [00:06, 22.62it/s][A[A[A


144it [00:06, 23.06it/s][A[A[A


147it [00:06, 23.03it/s][A[A[A


150it [00:06, 23.30it/s][A[A[A


153it [00:06, 23.38it/s][A[A[A


156it [00:06, 23.44it/s][A[A[A


159it [00:06, 23.57it/s][A[A[A


162it [00:06, 23.42it/s][A[A[A


165it [00:07, 23.45it/s][A[A[A


168it [00:07, 23.50it/s][A[A[A


171it [00:07, 23.48it/s][A[A[A


174it [00:07, 23.58it/s][A[A[A


177it [00:07, 23.72it/s][A[A[A


180it [00:07, 23.55it/s][A[A[A


183it [00:07, 23.61it/s][A[A[A


187it [00:08, 23.31it/s]


In [15]:
with t.no_grad():
    correct = 0
    total = 0
    for img, label in testLoader:
        img = img.to(device)
        label = label.to(device)
        outputs = net(img)
        _, predicted = t.max(outputs.data, 1)
        total += label.size(0)
        correct += (predicted == label).sum().item()
        print('Accuracy of the model on the test images: {} %'.format(100 * correct / total))

Accuracy of the model on the test images: 100.0 %
Accuracy of the model on the test images: 100.0 %
Accuracy of the model on the test images: 100.0 %
Accuracy of the model on the test images: 100.0 %
Accuracy of the model on the test images: 100.0 %
Accuracy of the model on the test images: 100.0 %
Accuracy of the model on the test images: 92.85714285714286 %
Accuracy of the model on the test images: 93.75 %
Accuracy of the model on the test images: 94.44444444444444 %
Accuracy of the model on the test images: 95.0 %
Accuracy of the model on the test images: 95.45454545454545 %
Accuracy of the model on the test images: 95.83333333333333 %
Accuracy of the model on the test images: 96.15384615384616 %
Accuracy of the model on the test images: 92.85714285714286 %
Accuracy of the model on the test images: 93.33333333333333 %
Accuracy of the model on the test images: 93.75 %
Accuracy of the model on the test images: 94.11764705882354 %
Accuracy of the model on the test images: 94.4444444444