## Multiclass Classification Model on MNIST Dataset with Mixup

### Dependencies Imports

In [2]:
import torch
import torch.nn as nn
import torch.nn.functional as F

import torch.optim as optim
from torch.utils.data import TensorDataset, DataLoader

import torchvision
import torchvision.datasets as datasets
import torchvision.transforms as transforms
from PIL import Image

import numpy as np
import random

### Data Preparation

In [3]:
transform = transforms.Compose([
    transforms.ToTensor(),
    transforms.Normalize((0.5,), (0.5,)),
])

In [4]:
mnist_train = datasets.MNIST(root='./data', train=True, download=False, transform=transform)
mnist_test = datasets.MNIST(root='./data', train=False, download=False, transform=transform)

### Model

In [5]:
class MNIST_Model(nn.Module):
    def __init__(self):
        super(MNIST_Model, self).__init__()
        self.hidden1 = nn.Linear(28*28, 50)
        self.output = nn.Linear(50, 10)
    def forward(self, x):
        x = self.hidden1(x)
        x = F.sigmoid(x)
        x = self.output(x)
        x = F.softmax(x)
        return x

### Training

In [7]:
def mixup_data(x, y, alpha=1.0):
    """Applies mixup to a single batch of data."""
    if alpha > 0:
        lam = np.random.beta(alpha, alpha)
    else:
        lam = 1

    batch_size = x.size()[0]
    index = torch.randperm(batch_size)

    mixed_x = lam * x + (1 - lam) * x[index, :]
    y_a, y_b = y, y[index]
    return mixed_x, y_a, y_b, lam

In [8]:
def train_model(model, train_data, alpha=1.0):
    train_loader = DataLoader(train_data, batch_size=10, shuffle=True)
    loss_fn = nn.CrossEntropyLoss()
    optimizer = optim.Adam(model.parameters(), lr=0.001)
    epochs = 10  # Note: changed 'epoch' to 'epochs' for clarity

    for epoch in range(epochs):
        model.train()
        batch = 0
        for data in train_loader:
            batch += 1
            x, y = data
            x, y_a, y_b, lam = mixup_data(x.view(-1, 28*28), y, alpha)
            optimizer.zero_grad()
            output = model(x)
            loss = lam * loss_fn(output, y_a) + (1 - lam) * loss_fn(output, y_b)
            print(f'Epoch {epoch + 1}, batch {batch}')
            print(f'Training loss: {loss.item()} \n')
            loss.backward()
            optimizer.step()
            
model = MNIST_Model()
train_model(model, mnist_train)

  x = F.softmax(x)


Epoch 1, batch 1
Training loss: 2.310678005218506 

Epoch 1, batch 2
Training loss: 2.280592679977417 

Epoch 1, batch 3
Training loss: 2.28916597366333 

Epoch 1, batch 4
Training loss: 2.3293840885162354 

Epoch 1, batch 5
Training loss: 2.323482036590576 

Epoch 1, batch 6
Training loss: 2.3030123710632324 

Epoch 1, batch 7
Training loss: 2.2996597290039062 

Epoch 1, batch 8
Training loss: 2.254042863845825 

Epoch 1, batch 9
Training loss: 2.325225591659546 

Epoch 1, batch 10
Training loss: 2.274379253387451 

Epoch 1, batch 11
Training loss: 2.305370330810547 

Epoch 1, batch 12
Training loss: 2.330580472946167 

Epoch 1, batch 13
Training loss: 2.324124574661255 

Epoch 1, batch 14
Training loss: 2.2795872688293457 

Epoch 1, batch 15
Training loss: 2.28515887260437 

Epoch 1, batch 16
Training loss: 2.271048069000244 

Epoch 1, batch 17
Training loss: 2.287893295288086 

Epoch 1, batch 18
Training loss: 2.282364845275879 

Epoch 1, batch 19
Training loss: 2.284468412399292 



Epoch 1, batch 160
Training loss: 2.049644708633423 

Epoch 1, batch 161
Training loss: 2.1075847148895264 

Epoch 1, batch 162
Training loss: 2.1460647583007812 

Epoch 1, batch 163
Training loss: 2.2185912132263184 

Epoch 1, batch 164
Training loss: 2.1662280559539795 

Epoch 1, batch 165
Training loss: 2.159369945526123 

Epoch 1, batch 166
Training loss: 2.115105628967285 

Epoch 1, batch 167
Training loss: 2.2002720832824707 

Epoch 1, batch 168
Training loss: 2.097087860107422 

Epoch 1, batch 169
Training loss: 2.1171138286590576 

Epoch 1, batch 170
Training loss: 2.1148295402526855 

Epoch 1, batch 171
Training loss: 2.2220606803894043 

Epoch 1, batch 172
Training loss: 1.9384597539901733 

Epoch 1, batch 173
Training loss: 2.2526237964630127 

Epoch 1, batch 174
Training loss: 2.071743965148926 

Epoch 1, batch 175
Training loss: 2.195497512817383 

Epoch 1, batch 176
Training loss: 2.1983394622802734 

Epoch 1, batch 177
Training loss: 2.006546974182129 

Epoch 1, batch 17

Epoch 1, batch 348
Training loss: 2.044792652130127 

Epoch 1, batch 349
Training loss: 1.876511573791504 

Epoch 1, batch 350
Training loss: 2.0167174339294434 

Epoch 1, batch 351
Training loss: 2.0258309841156006 

Epoch 1, batch 352
Training loss: 1.9759562015533447 

Epoch 1, batch 353
Training loss: 2.0927658081054688 

Epoch 1, batch 354
Training loss: 2.0816683769226074 

Epoch 1, batch 355
Training loss: 2.0937228202819824 

Epoch 1, batch 356
Training loss: 2.0363683700561523 

Epoch 1, batch 357
Training loss: 2.051100254058838 

Epoch 1, batch 358
Training loss: 1.990166425704956 

Epoch 1, batch 359
Training loss: 2.0344324111938477 

Epoch 1, batch 360
Training loss: 2.13844633102417 

Epoch 1, batch 361
Training loss: 1.9163111448287964 

Epoch 1, batch 362
Training loss: 2.0477609634399414 

Epoch 1, batch 363
Training loss: 2.076744318008423 

Epoch 1, batch 364
Training loss: 1.879331350326538 

Epoch 1, batch 365
Training loss: 2.0428435802459717 

Epoch 1, batch 366

Epoch 1, batch 550
Training loss: 2.091257333755493 

Epoch 1, batch 551
Training loss: 2.0541844367980957 

Epoch 1, batch 552
Training loss: 2.1060454845428467 

Epoch 1, batch 553
Training loss: 1.9072729349136353 

Epoch 1, batch 554
Training loss: 2.0225775241851807 

Epoch 1, batch 555
Training loss: 1.9875385761260986 

Epoch 1, batch 556
Training loss: 2.09385347366333 

Epoch 1, batch 557
Training loss: 1.9019944667816162 

Epoch 1, batch 558
Training loss: 2.001058578491211 

Epoch 1, batch 559
Training loss: 2.10783314704895 

Epoch 1, batch 560
Training loss: 1.985097050666809 

Epoch 1, batch 561
Training loss: 2.0933830738067627 

Epoch 1, batch 562
Training loss: 1.9409942626953125 

Epoch 1, batch 563
Training loss: 2.0684235095977783 

Epoch 1, batch 564
Training loss: 1.925426959991455 

Epoch 1, batch 565
Training loss: 2.018190860748291 

Epoch 1, batch 566
Training loss: 1.871867060661316 

Epoch 1, batch 567
Training loss: 1.7232798337936401 

Epoch 1, batch 568
T

Epoch 1, batch 754
Training loss: 1.976341724395752 

Epoch 1, batch 755
Training loss: 1.9317498207092285 

Epoch 1, batch 756
Training loss: 2.031097888946533 

Epoch 1, batch 757
Training loss: 1.934415578842163 

Epoch 1, batch 758
Training loss: 1.8543277978897095 

Epoch 1, batch 759
Training loss: 1.6201590299606323 

Epoch 1, batch 760
Training loss: 2.0345988273620605 

Epoch 1, batch 761
Training loss: 2.050844669342041 

Epoch 1, batch 762
Training loss: 1.7541072368621826 

Epoch 1, batch 763
Training loss: 2.0621931552886963 

Epoch 1, batch 764
Training loss: 2.04879093170166 

Epoch 1, batch 765
Training loss: 1.990237832069397 

Epoch 1, batch 766
Training loss: 1.930469274520874 

Epoch 1, batch 767
Training loss: 2.014909505844116 

Epoch 1, batch 768
Training loss: 1.7063738107681274 

Epoch 1, batch 769
Training loss: 1.6490200757980347 

Epoch 1, batch 770
Training loss: 1.974923849105835 

Epoch 1, batch 771
Training loss: 1.879180669784546 

Epoch 1, batch 772
Tr

Epoch 1, batch 954
Training loss: 1.995559573173523 

Epoch 1, batch 955
Training loss: 1.7274205684661865 

Epoch 1, batch 956
Training loss: 1.9383784532546997 

Epoch 1, batch 957
Training loss: 1.8701093196868896 

Epoch 1, batch 958
Training loss: 1.8636902570724487 

Epoch 1, batch 959
Training loss: 1.9155051708221436 

Epoch 1, batch 960
Training loss: 1.5561890602111816 

Epoch 1, batch 961
Training loss: 2.0164268016815186 

Epoch 1, batch 962
Training loss: 1.730101227760315 

Epoch 1, batch 963
Training loss: 1.7593556642532349 

Epoch 1, batch 964
Training loss: 1.9074292182922363 

Epoch 1, batch 965
Training loss: 1.58558988571167 

Epoch 1, batch 966
Training loss: 2.0857222080230713 

Epoch 1, batch 967
Training loss: 1.8611165285110474 

Epoch 1, batch 968
Training loss: 1.9284003973007202 

Epoch 1, batch 969
Training loss: 2.0385544300079346 

Epoch 1, batch 970
Training loss: 1.9609909057617188 

Epoch 1, batch 971
Training loss: 1.9400556087493896 

Epoch 1, batch

Epoch 1, batch 1154
Training loss: 2.024637222290039 

Epoch 1, batch 1155
Training loss: 1.8319847583770752 

Epoch 1, batch 1156
Training loss: 1.8792998790740967 

Epoch 1, batch 1157
Training loss: 1.8135662078857422 

Epoch 1, batch 1158
Training loss: 1.8669629096984863 

Epoch 1, batch 1159
Training loss: 1.877251386642456 

Epoch 1, batch 1160
Training loss: 1.999910831451416 

Epoch 1, batch 1161
Training loss: 1.7775380611419678 

Epoch 1, batch 1162
Training loss: 1.7271640300750732 

Epoch 1, batch 1163
Training loss: 1.5373241901397705 

Epoch 1, batch 1164
Training loss: 1.7901474237442017 

Epoch 1, batch 1165
Training loss: 1.9381338357925415 

Epoch 1, batch 1166
Training loss: 1.842911958694458 

Epoch 1, batch 1167
Training loss: 1.7591310739517212 

Epoch 1, batch 1168
Training loss: 1.6813695430755615 

Epoch 1, batch 1169
Training loss: 1.8699805736541748 

Epoch 1, batch 1170
Training loss: 2.1405975818634033 

Epoch 1, batch 1171
Training loss: 2.052858829498291

Epoch 1, batch 1354
Training loss: 1.9882439374923706 

Epoch 1, batch 1355
Training loss: 1.9431802034378052 

Epoch 1, batch 1356
Training loss: 1.865349531173706 

Epoch 1, batch 1357
Training loss: 1.8206892013549805 

Epoch 1, batch 1358
Training loss: 1.8282300233840942 

Epoch 1, batch 1359
Training loss: 1.6788136959075928 

Epoch 1, batch 1360
Training loss: 2.016660451889038 

Epoch 1, batch 1361
Training loss: 2.103506326675415 

Epoch 1, batch 1362
Training loss: 1.876542568206787 

Epoch 1, batch 1363
Training loss: 2.063750743865967 

Epoch 1, batch 1364
Training loss: 2.121925115585327 

Epoch 1, batch 1365
Training loss: 1.7593669891357422 

Epoch 1, batch 1366
Training loss: 1.7422559261322021 

Epoch 1, batch 1367
Training loss: 1.6745134592056274 

Epoch 1, batch 1368
Training loss: 1.8004554510116577 

Epoch 1, batch 1369
Training loss: 1.9346895217895508 

Epoch 1, batch 1370
Training loss: 1.912184238433838 

Epoch 1, batch 1371
Training loss: 2.079364776611328 



Epoch 1, batch 1554
Training loss: 1.7957701683044434 

Epoch 1, batch 1555
Training loss: 1.9410121440887451 

Epoch 1, batch 1556
Training loss: 1.672340750694275 

Epoch 1, batch 1557
Training loss: 1.7924463748931885 

Epoch 1, batch 1558
Training loss: 1.9916765689849854 

Epoch 1, batch 1559
Training loss: 1.675140619277954 

Epoch 1, batch 1560
Training loss: 1.88649320602417 

Epoch 1, batch 1561
Training loss: 1.9434624910354614 

Epoch 1, batch 1562
Training loss: 1.8877575397491455 

Epoch 1, batch 1563
Training loss: 1.8375439643859863 

Epoch 1, batch 1564
Training loss: 1.8485920429229736 

Epoch 1, batch 1565
Training loss: 1.921270728111267 

Epoch 1, batch 1566
Training loss: 2.0807416439056396 

Epoch 1, batch 1567
Training loss: 1.9198969602584839 

Epoch 1, batch 1568
Training loss: 1.767448902130127 

Epoch 1, batch 1569
Training loss: 2.0325584411621094 

Epoch 1, batch 1570
Training loss: 2.053271770477295 

Epoch 1, batch 1571
Training loss: 1.7302440404891968 


Epoch 1, batch 1755
Training loss: 1.9206042289733887 

Epoch 1, batch 1756
Training loss: 1.848912000656128 

Epoch 1, batch 1757
Training loss: 1.8030024766921997 

Epoch 1, batch 1758
Training loss: 1.923781394958496 

Epoch 1, batch 1759
Training loss: 1.842555284500122 

Epoch 1, batch 1760
Training loss: 1.8725595474243164 

Epoch 1, batch 1761
Training loss: 2.096893787384033 

Epoch 1, batch 1762
Training loss: 1.7909517288208008 

Epoch 1, batch 1763
Training loss: 1.7702316045761108 

Epoch 1, batch 1764
Training loss: 1.6968462467193604 

Epoch 1, batch 1765
Training loss: 1.7699050903320312 

Epoch 1, batch 1766
Training loss: 1.7592421770095825 

Epoch 1, batch 1767
Training loss: 1.8513832092285156 

Epoch 1, batch 1768
Training loss: 1.9488664865493774 

Epoch 1, batch 1769
Training loss: 1.8105952739715576 

Epoch 1, batch 1770
Training loss: 1.758373737335205 

Epoch 1, batch 1771
Training loss: 1.8513731956481934 

Epoch 1, batch 1772
Training loss: 2.0188186168670654

Epoch 1, batch 1954
Training loss: 1.9752217531204224 

Epoch 1, batch 1955
Training loss: 1.7748132944107056 

Epoch 1, batch 1956
Training loss: 1.7998459339141846 

Epoch 1, batch 1957
Training loss: 1.833019495010376 

Epoch 1, batch 1958
Training loss: 1.6466935873031616 

Epoch 1, batch 1959
Training loss: 1.5068354606628418 

Epoch 1, batch 1960
Training loss: 1.8251374959945679 

Epoch 1, batch 1961
Training loss: 2.039773464202881 

Epoch 1, batch 1962
Training loss: 1.944989562034607 

Epoch 1, batch 1963
Training loss: 1.9572536945343018 

Epoch 1, batch 1964
Training loss: 1.8552825450897217 

Epoch 1, batch 1965
Training loss: 1.8144241571426392 

Epoch 1, batch 1966
Training loss: 1.7431154251098633 

Epoch 1, batch 1967
Training loss: 1.6142539978027344 

Epoch 1, batch 1968
Training loss: 1.7092409133911133 

Epoch 1, batch 1969
Training loss: 1.8409802913665771 

Epoch 1, batch 1970
Training loss: 1.7300983667373657 

Epoch 1, batch 1971
Training loss: 1.83659648895263

Epoch 1, batch 2154
Training loss: 1.6863890886306763 

Epoch 1, batch 2155
Training loss: 1.8602100610733032 

Epoch 1, batch 2156
Training loss: 1.7579538822174072 

Epoch 1, batch 2157
Training loss: 2.0051896572113037 

Epoch 1, batch 2158
Training loss: 1.9189679622650146 

Epoch 1, batch 2159
Training loss: 2.2024221420288086 

Epoch 1, batch 2160
Training loss: 1.9151897430419922 

Epoch 1, batch 2161
Training loss: 1.803123116493225 

Epoch 1, batch 2162
Training loss: 1.889714241027832 

Epoch 1, batch 2163
Training loss: 1.6743396520614624 

Epoch 1, batch 2164
Training loss: 1.9450442790985107 

Epoch 1, batch 2165
Training loss: 1.8821940422058105 

Epoch 1, batch 2166
Training loss: 1.8133994340896606 

Epoch 1, batch 2167
Training loss: 1.905796766281128 

Epoch 1, batch 2168
Training loss: 1.9669556617736816 

Epoch 1, batch 2169
Training loss: 1.9682655334472656 

Epoch 1, batch 2170
Training loss: 1.7177350521087646 

Epoch 1, batch 2171
Training loss: 1.94020557403564

Epoch 1, batch 2355
Training loss: 1.9869372844696045 

Epoch 1, batch 2356
Training loss: 1.7321782112121582 

Epoch 1, batch 2357
Training loss: 1.946142315864563 

Epoch 1, batch 2358
Training loss: 2.0040156841278076 

Epoch 1, batch 2359
Training loss: 1.8459010124206543 

Epoch 1, batch 2360
Training loss: 1.9176523685455322 

Epoch 1, batch 2361
Training loss: 1.7074347734451294 

Epoch 1, batch 2362
Training loss: 1.622418999671936 

Epoch 1, batch 2363
Training loss: 1.9986820220947266 

Epoch 1, batch 2364
Training loss: 1.6985005140304565 

Epoch 1, batch 2365
Training loss: 1.9357566833496094 

Epoch 1, batch 2366
Training loss: 1.6923658847808838 

Epoch 1, batch 2367
Training loss: 1.9265189170837402 

Epoch 1, batch 2368
Training loss: 1.984581470489502 

Epoch 1, batch 2369
Training loss: 1.9676841497421265 

Epoch 1, batch 2370
Training loss: 1.8534204959869385 

Epoch 1, batch 2371
Training loss: 1.9101920127868652 

Epoch 1, batch 2372
Training loss: 1.67914652824401

Epoch 1, batch 2554
Training loss: 2.012242555618286 

Epoch 1, batch 2555
Training loss: 1.9341963529586792 

Epoch 1, batch 2556
Training loss: 1.6770212650299072 

Epoch 1, batch 2557
Training loss: 1.820076823234558 

Epoch 1, batch 2558
Training loss: 1.7424309253692627 

Epoch 1, batch 2559
Training loss: 1.7711291313171387 

Epoch 1, batch 2560
Training loss: 1.678358793258667 

Epoch 1, batch 2561
Training loss: 1.9314067363739014 

Epoch 1, batch 2562
Training loss: 1.8902997970581055 

Epoch 1, batch 2563
Training loss: 1.8977999687194824 

Epoch 1, batch 2564
Training loss: 1.5831660032272339 

Epoch 1, batch 2565
Training loss: 1.8122185468673706 

Epoch 1, batch 2566
Training loss: 1.8332226276397705 

Epoch 1, batch 2567
Training loss: 1.7601454257965088 

Epoch 1, batch 2568
Training loss: 1.8735296726226807 

Epoch 1, batch 2569
Training loss: 1.8385937213897705 

Epoch 1, batch 2570
Training loss: 1.9301034212112427 

Epoch 1, batch 2571
Training loss: 1.64877772331237

Epoch 1, batch 2755
Training loss: 1.899017095565796 

Epoch 1, batch 2756
Training loss: 1.6262905597686768 

Epoch 1, batch 2757
Training loss: 1.8210837841033936 

Epoch 1, batch 2758
Training loss: 2.010481595993042 

Epoch 1, batch 2759
Training loss: 1.7991710901260376 

Epoch 1, batch 2760
Training loss: 1.8353869915008545 

Epoch 1, batch 2761
Training loss: 1.721046805381775 

Epoch 1, batch 2762
Training loss: 1.8633317947387695 

Epoch 1, batch 2763
Training loss: 1.7298846244812012 

Epoch 1, batch 2764
Training loss: 1.6230428218841553 

Epoch 1, batch 2765
Training loss: 1.7149847745895386 

Epoch 1, batch 2766
Training loss: 1.8367770910263062 

Epoch 1, batch 2767
Training loss: 1.8483915328979492 

Epoch 1, batch 2768
Training loss: 1.8608534336090088 

Epoch 1, batch 2769
Training loss: 2.044529914855957 

Epoch 1, batch 2770
Training loss: 1.745470404624939 

Epoch 1, batch 2771
Training loss: 1.8593904972076416 

Epoch 1, batch 2772
Training loss: 1.8418887853622437

Epoch 1, batch 2953
Training loss: 1.737047553062439 

Epoch 1, batch 2954
Training loss: 1.8975226879119873 

Epoch 1, batch 2955
Training loss: 2.0239899158477783 

Epoch 1, batch 2956
Training loss: 1.901519775390625 

Epoch 1, batch 2957
Training loss: 1.5805346965789795 

Epoch 1, batch 2958
Training loss: 1.7328906059265137 

Epoch 1, batch 2959
Training loss: 1.7925641536712646 

Epoch 1, batch 2960
Training loss: 1.5606634616851807 

Epoch 1, batch 2961
Training loss: 1.964219093322754 

Epoch 1, batch 2962
Training loss: 1.7347743511199951 

Epoch 1, batch 2963
Training loss: 1.9037327766418457 

Epoch 1, batch 2964
Training loss: 2.0210914611816406 

Epoch 1, batch 2965
Training loss: 1.5823132991790771 

Epoch 1, batch 2966
Training loss: 1.7226195335388184 

Epoch 1, batch 2967
Training loss: 1.8848347663879395 

Epoch 1, batch 2968
Training loss: 1.8848655223846436 

Epoch 1, batch 2969
Training loss: 1.8341848850250244 

Epoch 1, batch 2970
Training loss: 1.81289386749267

Epoch 1, batch 3155
Training loss: 1.9671764373779297 

Epoch 1, batch 3156
Training loss: 1.8260380029678345 

Epoch 1, batch 3157
Training loss: 1.7832293510437012 

Epoch 1, batch 3158
Training loss: 1.845280408859253 

Epoch 1, batch 3159
Training loss: 2.025552272796631 

Epoch 1, batch 3160
Training loss: 1.97532057762146 

Epoch 1, batch 3161
Training loss: 1.8767099380493164 

Epoch 1, batch 3162
Training loss: 1.8513935804367065 

Epoch 1, batch 3163
Training loss: 1.7678463459014893 

Epoch 1, batch 3164
Training loss: 1.8456668853759766 

Epoch 1, batch 3165
Training loss: 1.9846981763839722 

Epoch 1, batch 3166
Training loss: 1.8188477754592896 

Epoch 1, batch 3167
Training loss: 1.7921147346496582 

Epoch 1, batch 3168
Training loss: 2.012953758239746 

Epoch 1, batch 3169
Training loss: 1.9017326831817627 

Epoch 1, batch 3170
Training loss: 1.9181077480316162 

Epoch 1, batch 3171
Training loss: 2.100064754486084 

Epoch 1, batch 3172
Training loss: 1.7315640449523926 

Epoch 1, batch 3354
Training loss: 1.8629822731018066 

Epoch 1, batch 3355
Training loss: 1.7113595008850098 

Epoch 1, batch 3356
Training loss: 1.9021215438842773 

Epoch 1, batch 3357
Training loss: 1.552502989768982 

Epoch 1, batch 3358
Training loss: 1.6488707065582275 

Epoch 1, batch 3359
Training loss: 1.8533415794372559 

Epoch 1, batch 3360
Training loss: 1.8576613664627075 

Epoch 1, batch 3361
Training loss: 1.9805340766906738 

Epoch 1, batch 3362
Training loss: 1.7135244607925415 

Epoch 1, batch 3363
Training loss: 1.610908031463623 

Epoch 1, batch 3364
Training loss: 1.7654023170471191 

Epoch 1, batch 3365
Training loss: 1.840558409690857 

Epoch 1, batch 3366
Training loss: 1.982944130897522 

Epoch 1, batch 3367
Training loss: 1.680391788482666 

Epoch 1, batch 3368
Training loss: 1.874260663986206 

Epoch 1, batch 3369
Training loss: 1.8963817358016968 

Epoch 1, batch 3370
Training loss: 1.7329834699630737 

Epoch 1, batch 3371
Training loss: 1.672776699066162 


Epoch 1, batch 3557
Training loss: 1.7857391834259033 

Epoch 1, batch 3558
Training loss: 1.6788561344146729 

Epoch 1, batch 3559
Training loss: 1.911219835281372 

Epoch 1, batch 3560
Training loss: 1.9674413204193115 

Epoch 1, batch 3561
Training loss: 2.0477166175842285 

Epoch 1, batch 3562
Training loss: 1.6601345539093018 

Epoch 1, batch 3563
Training loss: 1.682304859161377 

Epoch 1, batch 3564
Training loss: 1.7862106561660767 

Epoch 1, batch 3565
Training loss: 1.5986676216125488 

Epoch 1, batch 3566
Training loss: 1.7671847343444824 

Epoch 1, batch 3567
Training loss: 1.9796655178070068 

Epoch 1, batch 3568
Training loss: 1.7849931716918945 

Epoch 1, batch 3569
Training loss: 1.8051080703735352 

Epoch 1, batch 3570
Training loss: 1.7808690071105957 

Epoch 1, batch 3571
Training loss: 1.9384174346923828 

Epoch 1, batch 3572
Training loss: 1.884389042854309 

Epoch 1, batch 3573
Training loss: 1.6800518035888672 

Epoch 1, batch 3574
Training loss: 2.01356148719787

Epoch 1, batch 3759
Training loss: 1.8344647884368896 

Epoch 1, batch 3760
Training loss: 1.7980852127075195 

Epoch 1, batch 3761
Training loss: 1.8181318044662476 

Epoch 1, batch 3762
Training loss: 1.6681551933288574 

Epoch 1, batch 3763
Training loss: 2.018566608428955 

Epoch 1, batch 3764
Training loss: 1.8944309949874878 

Epoch 1, batch 3765
Training loss: 1.865709900856018 

Epoch 1, batch 3766
Training loss: 1.7436766624450684 

Epoch 1, batch 3767
Training loss: 1.899479866027832 

Epoch 1, batch 3768
Training loss: 1.8415271043777466 

Epoch 1, batch 3769
Training loss: 1.9999160766601562 

Epoch 1, batch 3770
Training loss: 1.975024700164795 

Epoch 1, batch 3771
Training loss: 1.8358557224273682 

Epoch 1, batch 3772
Training loss: 1.9679627418518066 

Epoch 1, batch 3773
Training loss: 2.0238280296325684 

Epoch 1, batch 3774
Training loss: 1.8920884132385254 

Epoch 1, batch 3775
Training loss: 1.8700141906738281 

Epoch 1, batch 3776
Training loss: 1.609337687492370

Epoch 1, batch 3958
Training loss: 1.9276812076568604 

Epoch 1, batch 3959
Training loss: 1.7525806427001953 

Epoch 1, batch 3960
Training loss: 1.8393748998641968 

Epoch 1, batch 3961
Training loss: 1.9196285009384155 

Epoch 1, batch 3962
Training loss: 1.4885237216949463 

Epoch 1, batch 3963
Training loss: 1.999611735343933 

Epoch 1, batch 3964
Training loss: 1.6123971939086914 

Epoch 1, batch 3965
Training loss: 1.5826168060302734 

Epoch 1, batch 3966
Training loss: 2.029383659362793 

Epoch 1, batch 3967
Training loss: 1.6141692399978638 

Epoch 1, batch 3968
Training loss: 1.749394416809082 

Epoch 1, batch 3969
Training loss: 1.9009501934051514 

Epoch 1, batch 3970
Training loss: 1.688499093055725 

Epoch 1, batch 3971
Training loss: 1.8410624265670776 

Epoch 1, batch 3972
Training loss: 1.8134386539459229 

Epoch 1, batch 3973
Training loss: 1.837334156036377 

Epoch 1, batch 3974
Training loss: 1.850367546081543 

Epoch 1, batch 3975
Training loss: 1.7520337104797363 

Epoch 1, batch 4161
Training loss: 1.52207350730896 

Epoch 1, batch 4162
Training loss: 1.7960517406463623 

Epoch 1, batch 4163
Training loss: 1.7053269147872925 

Epoch 1, batch 4164
Training loss: 1.5673224925994873 

Epoch 1, batch 4165
Training loss: 1.985214352607727 

Epoch 1, batch 4166
Training loss: 1.8378276824951172 

Epoch 1, batch 4167
Training loss: 1.728959321975708 

Epoch 1, batch 4168
Training loss: 1.9983997344970703 

Epoch 1, batch 4169
Training loss: 1.538861632347107 

Epoch 1, batch 4170
Training loss: 1.9198861122131348 

Epoch 1, batch 4171
Training loss: 1.6034326553344727 

Epoch 1, batch 4172
Training loss: 1.9589910507202148 

Epoch 1, batch 4173
Training loss: 1.7824361324310303 

Epoch 1, batch 4174
Training loss: 1.6534669399261475 

Epoch 1, batch 4175
Training loss: 1.8402764797210693 

Epoch 1, batch 4176
Training loss: 1.5351778268814087 

Epoch 1, batch 4177
Training loss: 1.9055066108703613 

Epoch 1, batch 4178
Training loss: 1.9645681381225586

Epoch 1, batch 4364
Training loss: 1.6738882064819336 

Epoch 1, batch 4365
Training loss: 1.6837503910064697 

Epoch 1, batch 4366
Training loss: 1.8748067617416382 

Epoch 1, batch 4367
Training loss: 1.9249567985534668 

Epoch 1, batch 4368
Training loss: 1.8861044645309448 

Epoch 1, batch 4369
Training loss: 1.7827284336090088 

Epoch 1, batch 4370
Training loss: 1.522486925125122 

Epoch 1, batch 4371
Training loss: 1.5667811632156372 

Epoch 1, batch 4372
Training loss: 1.5988911390304565 

Epoch 1, batch 4373
Training loss: 1.8101310729980469 

Epoch 1, batch 4374
Training loss: 1.7892793416976929 

Epoch 1, batch 4375
Training loss: 1.6723517179489136 

Epoch 1, batch 4376
Training loss: 1.813520908355713 

Epoch 1, batch 4377
Training loss: 1.646221399307251 

Epoch 1, batch 4378
Training loss: 1.9246318340301514 

Epoch 1, batch 4379
Training loss: 1.8251473903656006 

Epoch 1, batch 4380
Training loss: 1.8695685863494873 

Epoch 1, batch 4381
Training loss: 1.53119480609893

Epoch 1, batch 4568
Training loss: 1.7710521221160889 

Epoch 1, batch 4569
Training loss: 1.6933587789535522 

Epoch 1, batch 4570
Training loss: 1.7221423387527466 

Epoch 1, batch 4571
Training loss: 1.795190691947937 

Epoch 1, batch 4572
Training loss: 1.9257090091705322 

Epoch 1, batch 4573
Training loss: 1.815200924873352 

Epoch 1, batch 4574
Training loss: 1.6676008701324463 

Epoch 1, batch 4575
Training loss: 1.8577468395233154 

Epoch 1, batch 4576
Training loss: 1.8919529914855957 

Epoch 1, batch 4577
Training loss: 1.630547285079956 

Epoch 1, batch 4578
Training loss: 1.7720308303833008 

Epoch 1, batch 4579
Training loss: 1.645851492881775 

Epoch 1, batch 4580
Training loss: 1.8554048538208008 

Epoch 1, batch 4581
Training loss: 1.8681960105895996 

Epoch 1, batch 4582
Training loss: 1.8864367008209229 

Epoch 1, batch 4583
Training loss: 1.7059071063995361 

Epoch 1, batch 4584
Training loss: 1.879787802696228 

Epoch 1, batch 4585
Training loss: 1.7588878870010376

Epoch 1, batch 4772
Training loss: 1.7248685359954834 

Epoch 1, batch 4773
Training loss: 1.9972445964813232 

Epoch 1, batch 4774
Training loss: 1.57808518409729 

Epoch 1, batch 4775
Training loss: 1.7032498121261597 

Epoch 1, batch 4776
Training loss: 1.778005599975586 

Epoch 1, batch 4777
Training loss: 1.792820930480957 

Epoch 1, batch 4778
Training loss: 1.5307286977767944 

Epoch 1, batch 4779
Training loss: 1.85514497756958 

Epoch 1, batch 4780
Training loss: 1.8867549896240234 

Epoch 1, batch 4781
Training loss: 1.7108418941497803 

Epoch 1, batch 4782
Training loss: 1.7219884395599365 

Epoch 1, batch 4783
Training loss: 1.648167610168457 

Epoch 1, batch 4784
Training loss: 1.9136741161346436 

Epoch 1, batch 4785
Training loss: 1.5915950536727905 

Epoch 1, batch 4786
Training loss: 1.6331936120986938 

Epoch 1, batch 4787
Training loss: 1.8950300216674805 

Epoch 1, batch 4788
Training loss: 1.6048702001571655 

Epoch 1, batch 4789
Training loss: 1.800873041152954 



Epoch 1, batch 4976
Training loss: 1.6420834064483643 

Epoch 1, batch 4977
Training loss: 1.818681240081787 

Epoch 1, batch 4978
Training loss: 1.6353542804718018 

Epoch 1, batch 4979
Training loss: 1.9628267288208008 

Epoch 1, batch 4980
Training loss: 1.6093711853027344 

Epoch 1, batch 4981
Training loss: 1.6309449672698975 

Epoch 1, batch 4982
Training loss: 1.5964668989181519 

Epoch 1, batch 4983
Training loss: 1.9235700368881226 

Epoch 1, batch 4984
Training loss: 1.6902999877929688 

Epoch 1, batch 4985
Training loss: 1.897047758102417 

Epoch 1, batch 4986
Training loss: 1.8545045852661133 

Epoch 1, batch 4987
Training loss: 1.9755630493164062 

Epoch 1, batch 4988
Training loss: 1.7275097370147705 

Epoch 1, batch 4989
Training loss: 2.021723508834839 

Epoch 1, batch 4990
Training loss: 1.7141573429107666 

Epoch 1, batch 4991
Training loss: 1.9715673923492432 

Epoch 1, batch 4992
Training loss: 1.567627191543579 

Epoch 1, batch 4993
Training loss: 1.649146199226379

Epoch 1, batch 5178
Training loss: 1.9563854932785034 

Epoch 1, batch 5179
Training loss: 1.5976554155349731 

Epoch 1, batch 5180
Training loss: 1.8480501174926758 

Epoch 1, batch 5181
Training loss: 1.8498806953430176 

Epoch 1, batch 5182
Training loss: 1.6328284740447998 

Epoch 1, batch 5183
Training loss: 1.779422402381897 

Epoch 1, batch 5184
Training loss: 1.5372344255447388 

Epoch 1, batch 5185
Training loss: 1.8638291358947754 

Epoch 1, batch 5186
Training loss: 1.9199063777923584 

Epoch 1, batch 5187
Training loss: 2.0003905296325684 

Epoch 1, batch 5188
Training loss: 1.9966940879821777 

Epoch 1, batch 5189
Training loss: 1.7166118621826172 

Epoch 1, batch 5190
Training loss: 1.8954213857650757 

Epoch 1, batch 5191
Training loss: 1.8696529865264893 

Epoch 1, batch 5192
Training loss: 1.8218538761138916 

Epoch 1, batch 5193
Training loss: 1.7696518898010254 

Epoch 1, batch 5194
Training loss: 1.6228522062301636 

Epoch 1, batch 5195
Training loss: 1.769911050796

Epoch 1, batch 5371
Training loss: 1.90274977684021 

Epoch 1, batch 5372
Training loss: 1.7060847282409668 

Epoch 1, batch 5373
Training loss: 1.7573332786560059 

Epoch 1, batch 5374
Training loss: 1.7982118129730225 

Epoch 1, batch 5375
Training loss: 1.5580816268920898 

Epoch 1, batch 5376
Training loss: 1.8431164026260376 

Epoch 1, batch 5377
Training loss: 1.860021948814392 

Epoch 1, batch 5378
Training loss: 1.7287734746932983 

Epoch 1, batch 5379
Training loss: 1.705265760421753 

Epoch 1, batch 5380
Training loss: 1.879399299621582 

Epoch 1, batch 5381
Training loss: 1.829736590385437 

Epoch 1, batch 5382
Training loss: 1.671492099761963 

Epoch 1, batch 5383
Training loss: 1.7054826021194458 

Epoch 1, batch 5384
Training loss: 1.6444510221481323 

Epoch 1, batch 5385
Training loss: 1.8520772457122803 

Epoch 1, batch 5386
Training loss: 1.866537094116211 

Epoch 1, batch 5387
Training loss: 1.8724100589752197 

Epoch 1, batch 5388
Training loss: 1.92844557762146 

Ep

Epoch 1, batch 5572
Training loss: 1.7170838117599487 

Epoch 1, batch 5573
Training loss: 1.6851805448532104 

Epoch 1, batch 5574
Training loss: 1.7638094425201416 

Epoch 1, batch 5575
Training loss: 1.956654667854309 

Epoch 1, batch 5576
Training loss: 1.6545757055282593 

Epoch 1, batch 5577
Training loss: 1.5926158428192139 

Epoch 1, batch 5578
Training loss: 1.8811795711517334 

Epoch 1, batch 5579
Training loss: 1.7604236602783203 

Epoch 1, batch 5580
Training loss: 1.9100360870361328 

Epoch 1, batch 5581
Training loss: 1.7377063035964966 

Epoch 1, batch 5582
Training loss: 1.677367925643921 

Epoch 1, batch 5583
Training loss: 1.903027892112732 

Epoch 1, batch 5584
Training loss: 1.9285178184509277 

Epoch 1, batch 5585
Training loss: 1.8188209533691406 

Epoch 1, batch 5586
Training loss: 1.6981351375579834 

Epoch 1, batch 5587
Training loss: 1.9463518857955933 

Epoch 1, batch 5588
Training loss: 2.0124218463897705 

Epoch 1, batch 5589
Training loss: 1.63517141342163

Epoch 1, batch 5776
Training loss: 1.7477655410766602 

Epoch 1, batch 5777
Training loss: 1.516537070274353 

Epoch 1, batch 5778
Training loss: 1.8002312183380127 

Epoch 1, batch 5779
Training loss: 1.5947706699371338 

Epoch 1, batch 5780
Training loss: 1.8463705778121948 

Epoch 1, batch 5781
Training loss: 1.8605259656906128 

Epoch 1, batch 5782
Training loss: 1.636078119277954 

Epoch 1, batch 5783
Training loss: 1.7220768928527832 

Epoch 1, batch 5784
Training loss: 1.6962002515792847 

Epoch 1, batch 5785
Training loss: 1.6320419311523438 

Epoch 1, batch 5786
Training loss: 1.6159896850585938 

Epoch 1, batch 5787
Training loss: 1.9012612104415894 

Epoch 1, batch 5788
Training loss: 1.8394190073013306 

Epoch 1, batch 5789
Training loss: 1.7809076309204102 

Epoch 1, batch 5790
Training loss: 1.895271897315979 

Epoch 1, batch 5791
Training loss: 2.076242685317993 

Epoch 1, batch 5792
Training loss: 1.9443538188934326 

Epoch 1, batch 5793
Training loss: 1.799819588661193

Epoch 1, batch 5978
Training loss: 2.0123605728149414 

Epoch 1, batch 5979
Training loss: 1.7036792039871216 

Epoch 1, batch 5980
Training loss: 1.66483473777771 

Epoch 1, batch 5981
Training loss: 1.5721817016601562 

Epoch 1, batch 5982
Training loss: 1.7862093448638916 

Epoch 1, batch 5983
Training loss: 1.7612329721450806 

Epoch 1, batch 5984
Training loss: 1.7048112154006958 

Epoch 1, batch 5985
Training loss: 1.6510365009307861 

Epoch 1, batch 5986
Training loss: 2.010213613510132 

Epoch 1, batch 5987
Training loss: 1.4961800575256348 

Epoch 1, batch 5988
Training loss: 1.679824948310852 

Epoch 1, batch 5989
Training loss: 1.7027993202209473 

Epoch 1, batch 5990
Training loss: 1.7048474550247192 

Epoch 1, batch 5991
Training loss: 1.927120566368103 

Epoch 1, batch 5992
Training loss: 2.0350968837738037 

Epoch 1, batch 5993
Training loss: 1.835233449935913 

Epoch 1, batch 5994
Training loss: 1.6022623777389526 

Epoch 1, batch 5995
Training loss: 1.7596333026885986 

Epoch 2, batch 175
Training loss: 1.5818034410476685 

Epoch 2, batch 176
Training loss: 1.859336256980896 

Epoch 2, batch 177
Training loss: 1.710004448890686 

Epoch 2, batch 178
Training loss: 1.8023862838745117 

Epoch 2, batch 179
Training loss: 1.6619523763656616 

Epoch 2, batch 180
Training loss: 1.9139593839645386 

Epoch 2, batch 181
Training loss: 1.5994408130645752 

Epoch 2, batch 182
Training loss: 1.727027177810669 

Epoch 2, batch 183
Training loss: 1.679115653038025 

Epoch 2, batch 184
Training loss: 1.6718392372131348 

Epoch 2, batch 185
Training loss: 2.0331921577453613 

Epoch 2, batch 186
Training loss: 1.9043712615966797 

Epoch 2, batch 187
Training loss: 1.6203333139419556 

Epoch 2, batch 188
Training loss: 1.8580713272094727 

Epoch 2, batch 189
Training loss: 1.5888564586639404 

Epoch 2, batch 190
Training loss: 1.748136043548584 

Epoch 2, batch 191
Training loss: 1.7840054035186768 

Epoch 2, batch 192
Training loss: 1.800377607345581 

Epoch 2, batch 1

Epoch 2, batch 376
Training loss: 1.7502570152282715 

Epoch 2, batch 377
Training loss: 1.6915547847747803 

Epoch 2, batch 378
Training loss: 1.856742262840271 

Epoch 2, batch 379
Training loss: 2.0304126739501953 

Epoch 2, batch 380
Training loss: 1.9203200340270996 

Epoch 2, batch 381
Training loss: 1.7836666107177734 

Epoch 2, batch 382
Training loss: 1.934903621673584 

Epoch 2, batch 383
Training loss: 1.928591012954712 

Epoch 2, batch 384
Training loss: 2.0509660243988037 

Epoch 2, batch 385
Training loss: 1.7420542240142822 

Epoch 2, batch 386
Training loss: 1.6175061464309692 

Epoch 2, batch 387
Training loss: 1.7756874561309814 

Epoch 2, batch 388
Training loss: 1.6904069185256958 

Epoch 2, batch 389
Training loss: 1.8029670715332031 

Epoch 2, batch 390
Training loss: 1.7300522327423096 

Epoch 2, batch 391
Training loss: 1.8159936666488647 

Epoch 2, batch 392
Training loss: 1.632368564605713 

Epoch 2, batch 393
Training loss: 1.8517401218414307 

Epoch 2, batch

Epoch 2, batch 577
Training loss: 1.6032748222351074 

Epoch 2, batch 578
Training loss: 1.8229230642318726 

Epoch 2, batch 579
Training loss: 1.8458609580993652 

Epoch 2, batch 580
Training loss: 2.020284652709961 

Epoch 2, batch 581
Training loss: 1.5036181211471558 

Epoch 2, batch 582
Training loss: 1.6918443441390991 

Epoch 2, batch 583
Training loss: 1.7177734375 

Epoch 2, batch 584
Training loss: 1.8343255519866943 

Epoch 2, batch 585
Training loss: 1.6709855794906616 

Epoch 2, batch 586
Training loss: 1.9381216764450073 

Epoch 2, batch 587
Training loss: 2.0865399837493896 

Epoch 2, batch 588
Training loss: 1.7894788980484009 

Epoch 2, batch 589
Training loss: 1.6394281387329102 

Epoch 2, batch 590
Training loss: 1.637372374534607 

Epoch 2, batch 591
Training loss: 1.48271644115448 

Epoch 2, batch 592
Training loss: 1.8722416162490845 

Epoch 2, batch 593
Training loss: 1.904003620147705 

Epoch 2, batch 594
Training loss: 1.7257862091064453 

Epoch 2, batch 595
Tr

Epoch 2, batch 777
Training loss: 1.6041812896728516 

Epoch 2, batch 778
Training loss: 1.7034225463867188 

Epoch 2, batch 779
Training loss: 1.8283857107162476 

Epoch 2, batch 780
Training loss: 1.7832553386688232 

Epoch 2, batch 781
Training loss: 1.6153324842453003 

Epoch 2, batch 782
Training loss: 1.7086800336837769 

Epoch 2, batch 783
Training loss: 1.7827900648117065 

Epoch 2, batch 784
Training loss: 1.5270476341247559 

Epoch 2, batch 785
Training loss: 1.9463638067245483 

Epoch 2, batch 786
Training loss: 1.625065803527832 

Epoch 2, batch 787
Training loss: 1.7333641052246094 

Epoch 2, batch 788
Training loss: 1.8825149536132812 

Epoch 2, batch 789
Training loss: 1.8948490619659424 

Epoch 2, batch 790
Training loss: 1.8399035930633545 

Epoch 2, batch 791
Training loss: 1.7010570764541626 

Epoch 2, batch 792
Training loss: 1.7542996406555176 

Epoch 2, batch 793
Training loss: 1.637910008430481 

Epoch 2, batch 794
Training loss: 1.8304274082183838 

Epoch 2, bat

Epoch 2, batch 979
Training loss: 1.8267154693603516 

Epoch 2, batch 980
Training loss: 1.6650102138519287 

Epoch 2, batch 981
Training loss: 1.5799453258514404 

Epoch 2, batch 982
Training loss: 1.4889291524887085 

Epoch 2, batch 983
Training loss: 1.6835238933563232 

Epoch 2, batch 984
Training loss: 1.8443409204483032 

Epoch 2, batch 985
Training loss: 1.8230104446411133 

Epoch 2, batch 986
Training loss: 1.8493434190750122 

Epoch 2, batch 987
Training loss: 1.98478364944458 

Epoch 2, batch 988
Training loss: 1.799141526222229 

Epoch 2, batch 989
Training loss: 1.95566725730896 

Epoch 2, batch 990
Training loss: 1.86238694190979 

Epoch 2, batch 991
Training loss: 1.7544137239456177 

Epoch 2, batch 992
Training loss: 1.822403073310852 

Epoch 2, batch 993
Training loss: 1.7445380687713623 

Epoch 2, batch 994
Training loss: 1.5740653276443481 

Epoch 2, batch 995
Training loss: 1.639102578163147 

Epoch 2, batch 996
Training loss: 1.9608814716339111 

Epoch 2, batch 997


Epoch 2, batch 1180
Training loss: 1.8013145923614502 

Epoch 2, batch 1181
Training loss: 1.5584690570831299 

Epoch 2, batch 1182
Training loss: 1.7227933406829834 

Epoch 2, batch 1183
Training loss: 2.0159506797790527 

Epoch 2, batch 1184
Training loss: 1.8438754081726074 

Epoch 2, batch 1185
Training loss: 1.7453522682189941 

Epoch 2, batch 1186
Training loss: 1.8309261798858643 

Epoch 2, batch 1187
Training loss: 1.8351905345916748 

Epoch 2, batch 1188
Training loss: 1.8334541320800781 

Epoch 2, batch 1189
Training loss: 1.8956820964813232 

Epoch 2, batch 1190
Training loss: 1.9101336002349854 

Epoch 2, batch 1191
Training loss: 1.6665687561035156 

Epoch 2, batch 1192
Training loss: 1.6057312488555908 

Epoch 2, batch 1193
Training loss: 1.6783696413040161 

Epoch 2, batch 1194
Training loss: 1.5650060176849365 

Epoch 2, batch 1195
Training loss: 1.7508318424224854 

Epoch 2, batch 1196
Training loss: 1.9100826978683472 

Epoch 2, batch 1197
Training loss: 2.00585007667

Epoch 2, batch 1383
Training loss: 1.8114418983459473 

Epoch 2, batch 1384
Training loss: 1.5687819719314575 

Epoch 2, batch 1385
Training loss: 1.6095004081726074 

Epoch 2, batch 1386
Training loss: 1.819636583328247 

Epoch 2, batch 1387
Training loss: 1.7246567010879517 

Epoch 2, batch 1388
Training loss: 1.9173386096954346 

Epoch 2, batch 1389
Training loss: 1.734458327293396 

Epoch 2, batch 1390
Training loss: 1.6178665161132812 

Epoch 2, batch 1391
Training loss: 1.6302390098571777 

Epoch 2, batch 1392
Training loss: 1.8158197402954102 

Epoch 2, batch 1393
Training loss: 1.556296944618225 

Epoch 2, batch 1394
Training loss: 1.8752901554107666 

Epoch 2, batch 1395
Training loss: 1.6751008033752441 

Epoch 2, batch 1396
Training loss: 1.8373513221740723 

Epoch 2, batch 1397
Training loss: 1.9616334438323975 

Epoch 2, batch 1398
Training loss: 1.5483710765838623 

Epoch 2, batch 1399
Training loss: 1.7090498208999634 

Epoch 2, batch 1400
Training loss: 1.75072884559631

Epoch 2, batch 1585
Training loss: 1.881786823272705 

Epoch 2, batch 1586
Training loss: 2.077489137649536 

Epoch 2, batch 1587
Training loss: 1.9863059520721436 

Epoch 2, batch 1588
Training loss: 1.5718913078308105 

Epoch 2, batch 1589
Training loss: 1.9024888277053833 

Epoch 2, batch 1590
Training loss: 1.5181140899658203 

Epoch 2, batch 1591
Training loss: 1.7497475147247314 

Epoch 2, batch 1592
Training loss: 1.701979160308838 

Epoch 2, batch 1593
Training loss: 1.8313941955566406 

Epoch 2, batch 1594
Training loss: 1.9569435119628906 

Epoch 2, batch 1595
Training loss: 1.8250406980514526 

Epoch 2, batch 1596
Training loss: 1.7788598537445068 

Epoch 2, batch 1597
Training loss: 1.9939963817596436 

Epoch 2, batch 1598
Training loss: 1.901127815246582 

Epoch 2, batch 1599
Training loss: 1.5597028732299805 

Epoch 2, batch 1600
Training loss: 1.7739717960357666 

Epoch 2, batch 1601
Training loss: 1.8079636096954346 

Epoch 2, batch 1602
Training loss: 1.585200309753418

Epoch 2, batch 1786
Training loss: 1.7338283061981201 

Epoch 2, batch 1787
Training loss: 1.6104191541671753 

Epoch 2, batch 1788
Training loss: 1.7821229696273804 

Epoch 2, batch 1789
Training loss: 1.715564489364624 

Epoch 2, batch 1790
Training loss: 1.5427520275115967 

Epoch 2, batch 1791
Training loss: 1.962398648262024 

Epoch 2, batch 1792
Training loss: 1.6513853073120117 

Epoch 2, batch 1793
Training loss: 1.4830271005630493 

Epoch 2, batch 1794
Training loss: 1.7255208492279053 

Epoch 2, batch 1795
Training loss: 1.6173609495162964 

Epoch 2, batch 1796
Training loss: 1.6186373233795166 

Epoch 2, batch 1797
Training loss: 1.8498178720474243 

Epoch 2, batch 1798
Training loss: 1.862452745437622 

Epoch 2, batch 1799
Training loss: 1.5941020250320435 

Epoch 2, batch 1800
Training loss: 1.6002877950668335 

Epoch 2, batch 1801
Training loss: 1.5587385892868042 

Epoch 2, batch 1802
Training loss: 1.8683730363845825 

Epoch 2, batch 1803
Training loss: 1.71060204505920

Epoch 2, batch 1985
Training loss: 1.8116331100463867 

Epoch 2, batch 1986
Training loss: 1.9158573150634766 

Epoch 2, batch 1987
Training loss: 1.4909666776657104 

Epoch 2, batch 1988
Training loss: 1.9177250862121582 

Epoch 2, batch 1989
Training loss: 1.5958893299102783 

Epoch 2, batch 1990
Training loss: 1.6638985872268677 

Epoch 2, batch 1991
Training loss: 1.8263834714889526 

Epoch 2, batch 1992
Training loss: 1.5750046968460083 

Epoch 2, batch 1993
Training loss: 1.647611379623413 

Epoch 2, batch 1994
Training loss: 1.9304111003875732 

Epoch 2, batch 1995
Training loss: 1.6185345649719238 

Epoch 2, batch 1996
Training loss: 1.788612723350525 

Epoch 2, batch 1997
Training loss: 1.8513133525848389 

Epoch 2, batch 1998
Training loss: 1.7535687685012817 

Epoch 2, batch 1999
Training loss: 1.7384886741638184 

Epoch 2, batch 2000
Training loss: 1.6114392280578613 

Epoch 2, batch 2001
Training loss: 1.7720073461532593 

Epoch 2, batch 2002
Training loss: 1.6940407752990

Epoch 2, batch 2186
Training loss: 1.5673021078109741 

Epoch 2, batch 2187
Training loss: 2.0206103324890137 

Epoch 2, batch 2188
Training loss: 1.5504732131958008 

Epoch 2, batch 2189
Training loss: 1.8840996026992798 

Epoch 2, batch 2190
Training loss: 1.6857799291610718 

Epoch 2, batch 2191
Training loss: 1.8041131496429443 

Epoch 2, batch 2192
Training loss: 1.7473061084747314 

Epoch 2, batch 2193
Training loss: 1.6030491590499878 

Epoch 2, batch 2194
Training loss: 1.5672749280929565 

Epoch 2, batch 2195
Training loss: 1.7459853887557983 

Epoch 2, batch 2196
Training loss: 1.9873619079589844 

Epoch 2, batch 2197
Training loss: 1.81890869140625 

Epoch 2, batch 2198
Training loss: 1.730712890625 

Epoch 2, batch 2199
Training loss: 1.8991923332214355 

Epoch 2, batch 2200
Training loss: 1.6940710544586182 

Epoch 2, batch 2201
Training loss: 1.8513069152832031 

Epoch 2, batch 2202
Training loss: 1.9857540130615234 

Epoch 2, batch 2203
Training loss: 1.730613350868225 


Epoch 2, batch 2389
Training loss: 1.8334168195724487 

Epoch 2, batch 2390
Training loss: 1.9142398834228516 

Epoch 2, batch 2391
Training loss: 1.8719794750213623 

Epoch 2, batch 2392
Training loss: 1.721582055091858 

Epoch 2, batch 2393
Training loss: 1.475565791130066 

Epoch 2, batch 2394
Training loss: 1.8832504749298096 

Epoch 2, batch 2395
Training loss: 1.8691637516021729 

Epoch 2, batch 2396
Training loss: 1.5781073570251465 

Epoch 2, batch 2397
Training loss: 1.895381212234497 

Epoch 2, batch 2398
Training loss: 1.862770915031433 

Epoch 2, batch 2399
Training loss: 1.6891422271728516 

Epoch 2, batch 2400
Training loss: 1.5917950868606567 

Epoch 2, batch 2401
Training loss: 1.8935143947601318 

Epoch 2, batch 2402
Training loss: 1.9119915962219238 

Epoch 2, batch 2403
Training loss: 1.483546257019043 

Epoch 2, batch 2404
Training loss: 1.6812984943389893 

Epoch 2, batch 2405
Training loss: 1.7711694240570068 

Epoch 2, batch 2406
Training loss: 1.800032138824463 

Epoch 2, batch 2594
Training loss: 1.9280800819396973 

Epoch 2, batch 2595
Training loss: 1.8874238729476929 

Epoch 2, batch 2596
Training loss: 1.8506660461425781 

Epoch 2, batch 2597
Training loss: 2.005312442779541 

Epoch 2, batch 2598
Training loss: 1.538214087486267 

Epoch 2, batch 2599
Training loss: 1.7966759204864502 

Epoch 2, batch 2600
Training loss: 1.6792036294937134 

Epoch 2, batch 2601
Training loss: 1.7757656574249268 

Epoch 2, batch 2602
Training loss: 1.7954483032226562 

Epoch 2, batch 2603
Training loss: 1.6472771167755127 

Epoch 2, batch 2604
Training loss: 1.6733554601669312 

Epoch 2, batch 2605
Training loss: 1.6665652990341187 

Epoch 2, batch 2606
Training loss: 1.8642313480377197 

Epoch 2, batch 2607
Training loss: 1.7856197357177734 

Epoch 2, batch 2608
Training loss: 1.6975871324539185 

Epoch 2, batch 2609
Training loss: 1.617067575454712 

Epoch 2, batch 2610
Training loss: 1.5419119596481323 

Epoch 2, batch 2611
Training loss: 1.72957718372344

Epoch 2, batch 2796
Training loss: 1.8321406841278076 

Epoch 2, batch 2797
Training loss: 1.749950647354126 

Epoch 2, batch 2798
Training loss: 1.9272010326385498 

Epoch 2, batch 2799
Training loss: 1.7093418836593628 

Epoch 2, batch 2800
Training loss: 1.7136783599853516 

Epoch 2, batch 2801
Training loss: 1.6502805948257446 

Epoch 2, batch 2802
Training loss: 1.8491978645324707 

Epoch 2, batch 2803
Training loss: 1.7426817417144775 

Epoch 2, batch 2804
Training loss: 2.024503469467163 

Epoch 2, batch 2805
Training loss: 1.8459553718566895 

Epoch 2, batch 2806
Training loss: 1.5784969329833984 

Epoch 2, batch 2807
Training loss: 1.8623969554901123 

Epoch 2, batch 2808
Training loss: 1.6674762964248657 

Epoch 2, batch 2809
Training loss: 1.7505748271942139 

Epoch 2, batch 2810
Training loss: 1.7182867527008057 

Epoch 2, batch 2811
Training loss: 1.7525830268859863 

Epoch 2, batch 2812
Training loss: 1.9809718132019043 

Epoch 2, batch 2813
Training loss: 1.7333090305328

Epoch 2, batch 2995
Training loss: 1.65888512134552 

Epoch 2, batch 2996
Training loss: 1.5612469911575317 

Epoch 2, batch 2997
Training loss: 1.6049938201904297 

Epoch 2, batch 2998
Training loss: 2.0330638885498047 

Epoch 2, batch 2999
Training loss: 1.735851764678955 

Epoch 2, batch 3000
Training loss: 1.699967861175537 

Epoch 2, batch 3001
Training loss: 1.6727781295776367 

Epoch 2, batch 3002
Training loss: 1.6470352411270142 

Epoch 2, batch 3003
Training loss: 1.8819150924682617 

Epoch 2, batch 3004
Training loss: 1.552504539489746 

Epoch 2, batch 3005
Training loss: 1.868809700012207 

Epoch 2, batch 3006
Training loss: 1.7370777130126953 

Epoch 2, batch 3007
Training loss: 1.847464680671692 

Epoch 2, batch 3008
Training loss: 1.7841854095458984 

Epoch 2, batch 3009
Training loss: 1.6701574325561523 

Epoch 2, batch 3010
Training loss: 1.8013606071472168 

Epoch 2, batch 3011
Training loss: 1.9796533584594727 

Epoch 2, batch 3012
Training loss: 1.592673420906067 



Epoch 2, batch 3197
Training loss: 1.553024172782898 

Epoch 2, batch 3198
Training loss: 1.8435242176055908 

Epoch 2, batch 3199
Training loss: 1.930649995803833 

Epoch 2, batch 3200
Training loss: 1.5999476909637451 

Epoch 2, batch 3201
Training loss: 1.640640139579773 

Epoch 2, batch 3202
Training loss: 1.9435278177261353 

Epoch 2, batch 3203
Training loss: 1.9490537643432617 

Epoch 2, batch 3204
Training loss: 1.8917243480682373 

Epoch 2, batch 3205
Training loss: 1.5791373252868652 

Epoch 2, batch 3206
Training loss: 1.5106866359710693 

Epoch 2, batch 3207
Training loss: 2.0009100437164307 

Epoch 2, batch 3208
Training loss: 1.9487226009368896 

Epoch 2, batch 3209
Training loss: 1.725374460220337 

Epoch 2, batch 3210
Training loss: 1.6182337999343872 

Epoch 2, batch 3211
Training loss: 1.7735106945037842 

Epoch 2, batch 3212
Training loss: 1.8083629608154297 

Epoch 2, batch 3213
Training loss: 1.7948565483093262 

Epoch 2, batch 3214
Training loss: 1.772174715995788

Epoch 2, batch 3399
Training loss: 1.7961452007293701 

Epoch 2, batch 3400
Training loss: 1.7703239917755127 

Epoch 2, batch 3401
Training loss: 1.6259980201721191 

Epoch 2, batch 3402
Training loss: 1.7802932262420654 

Epoch 2, batch 3403
Training loss: 1.6740883588790894 

Epoch 2, batch 3404
Training loss: 1.5391968488693237 

Epoch 2, batch 3405
Training loss: 2.1818251609802246 

Epoch 2, batch 3406
Training loss: 1.644768476486206 

Epoch 2, batch 3407
Training loss: 1.6723600625991821 

Epoch 2, batch 3408
Training loss: 1.751278042793274 

Epoch 2, batch 3409
Training loss: 1.8279051780700684 

Epoch 2, batch 3410
Training loss: 1.7169444561004639 

Epoch 2, batch 3411
Training loss: 1.724460482597351 

Epoch 2, batch 3412
Training loss: 1.7705479860305786 

Epoch 2, batch 3413
Training loss: 1.667604684829712 

Epoch 2, batch 3414
Training loss: 1.9835433959960938 

Epoch 2, batch 3415
Training loss: 1.8356547355651855 

Epoch 2, batch 3416
Training loss: 1.731346726417541

Epoch 2, batch 3601
Training loss: 1.6998810768127441 

Epoch 2, batch 3602
Training loss: 1.5745259523391724 

Epoch 2, batch 3603
Training loss: 1.7554421424865723 

Epoch 2, batch 3604
Training loss: 1.90012526512146 

Epoch 2, batch 3605
Training loss: 1.542409062385559 

Epoch 2, batch 3606
Training loss: 1.971449375152588 

Epoch 2, batch 3607
Training loss: 1.6106376647949219 

Epoch 2, batch 3608
Training loss: 1.7756519317626953 

Epoch 2, batch 3609
Training loss: 1.773688554763794 

Epoch 2, batch 3610
Training loss: 1.7676080465316772 

Epoch 2, batch 3611
Training loss: 1.7841928005218506 

Epoch 2, batch 3612
Training loss: 1.913031816482544 

Epoch 2, batch 3613
Training loss: 1.749249815940857 

Epoch 2, batch 3614
Training loss: 1.489405632019043 

Epoch 2, batch 3615
Training loss: 1.9072661399841309 

Epoch 2, batch 3616
Training loss: 1.742891788482666 

Epoch 2, batch 3617
Training loss: 1.8379477262496948 

Epoch 2, batch 3618
Training loss: 1.703249216079712 

Ep

Epoch 2, batch 3803
Training loss: 2.0711050033569336 

Epoch 2, batch 3804
Training loss: 1.826226830482483 

Epoch 2, batch 3805
Training loss: 1.8538541793823242 

Epoch 2, batch 3806
Training loss: 1.8796474933624268 

Epoch 2, batch 3807
Training loss: 1.990455985069275 

Epoch 2, batch 3808
Training loss: 1.5591284036636353 

Epoch 2, batch 3809
Training loss: 1.8052208423614502 

Epoch 2, batch 3810
Training loss: 1.8528664112091064 

Epoch 2, batch 3811
Training loss: 1.5791690349578857 

Epoch 2, batch 3812
Training loss: 1.593561053276062 

Epoch 2, batch 3813
Training loss: 1.791029453277588 

Epoch 2, batch 3814
Training loss: 1.5672909021377563 

Epoch 2, batch 3815
Training loss: 1.7890396118164062 

Epoch 2, batch 3816
Training loss: 1.7931331396102905 

Epoch 2, batch 3817
Training loss: 1.7489269971847534 

Epoch 2, batch 3818
Training loss: 1.8808125257492065 

Epoch 2, batch 3819
Training loss: 1.7975002527236938 

Epoch 2, batch 3820
Training loss: 1.831502437591552

Epoch 2, batch 3972
Training loss: 1.7265745401382446 

Epoch 2, batch 3973
Training loss: 1.4696725606918335 

Epoch 2, batch 3974
Training loss: 1.7014594078063965 

Epoch 2, batch 3975
Training loss: 1.753196120262146 

Epoch 2, batch 3976
Training loss: 1.6213202476501465 

Epoch 2, batch 3977
Training loss: 1.6822881698608398 

Epoch 2, batch 3978
Training loss: 1.892781138420105 

Epoch 2, batch 3979
Training loss: 1.7874844074249268 

Epoch 2, batch 3980
Training loss: 1.7254972457885742 

Epoch 2, batch 3981
Training loss: 1.7015019655227661 

Epoch 2, batch 3982
Training loss: 1.6515824794769287 

Epoch 2, batch 3983
Training loss: 1.631612777709961 

Epoch 2, batch 3984
Training loss: 1.7700934410095215 

Epoch 2, batch 3985
Training loss: 1.5899771451950073 

Epoch 2, batch 3986
Training loss: 1.930654525756836 

Epoch 2, batch 3987
Training loss: 1.7519702911376953 

Epoch 2, batch 3988
Training loss: 1.813283085823059 

Epoch 2, batch 3989
Training loss: 1.670627474784851 

Epoch 2, batch 4156
Training loss: 1.6969561576843262 

Epoch 2, batch 4157
Training loss: 1.5571861267089844 

Epoch 2, batch 4158
Training loss: 1.616283893585205 

Epoch 2, batch 4159
Training loss: 1.9799282550811768 

Epoch 2, batch 4160
Training loss: 1.914602279663086 

Epoch 2, batch 4161
Training loss: 1.6055227518081665 

Epoch 2, batch 4162
Training loss: 1.7694928646087646 

Epoch 2, batch 4163
Training loss: 1.8568291664123535 

Epoch 2, batch 4164
Training loss: 1.638585090637207 

Epoch 2, batch 4165
Training loss: 1.9975157976150513 

Epoch 2, batch 4166
Training loss: 1.5597212314605713 

Epoch 2, batch 4167
Training loss: 1.7028840780258179 

Epoch 2, batch 4168
Training loss: 1.639114260673523 

Epoch 2, batch 4169
Training loss: 1.940195083618164 

Epoch 2, batch 4170
Training loss: 1.9902820587158203 

Epoch 2, batch 4171
Training loss: 1.6690713167190552 

Epoch 2, batch 4172
Training loss: 1.9318060874938965 

Epoch 2, batch 4173
Training loss: 1.745497465133667 

Epoch 2, batch 4357
Training loss: 1.895408272743225 

Epoch 2, batch 4358
Training loss: 2.0434117317199707 

Epoch 2, batch 4359
Training loss: 1.4813898801803589 

Epoch 2, batch 4360
Training loss: 1.7958699464797974 

Epoch 2, batch 4361
Training loss: 1.8164453506469727 

Epoch 2, batch 4362
Training loss: 1.7506492137908936 

Epoch 2, batch 4363
Training loss: 1.902007818222046 

Epoch 2, batch 4364
Training loss: 1.872382640838623 

Epoch 2, batch 4365
Training loss: 1.7963497638702393 

Epoch 2, batch 4366
Training loss: 1.4977011680603027 

Epoch 2, batch 4367
Training loss: 1.8832529783248901 

Epoch 2, batch 4368
Training loss: 1.8301470279693604 

Epoch 2, batch 4369
Training loss: 1.6125725507736206 

Epoch 2, batch 4370
Training loss: 1.5607428550720215 

Epoch 2, batch 4371
Training loss: 1.8561713695526123 

Epoch 2, batch 4372
Training loss: 1.6843808889389038 

Epoch 2, batch 4373
Training loss: 1.7318735122680664 

Epoch 2, batch 4374
Training loss: 1.80859446525573

Epoch 2, batch 4560
Training loss: 1.698699951171875 

Epoch 2, batch 4561
Training loss: 1.9040334224700928 

Epoch 2, batch 4562
Training loss: 1.613652229309082 

Epoch 2, batch 4563
Training loss: 1.7569113969802856 

Epoch 2, batch 4564
Training loss: 1.6350655555725098 

Epoch 2, batch 4565
Training loss: 1.5387959480285645 

Epoch 2, batch 4566
Training loss: 1.5874758958816528 

Epoch 2, batch 4567
Training loss: 1.685293436050415 

Epoch 2, batch 4568
Training loss: 1.8520288467407227 

Epoch 2, batch 4569
Training loss: 1.747279405593872 

Epoch 2, batch 4570
Training loss: 1.731737494468689 

Epoch 2, batch 4571
Training loss: 1.635521650314331 

Epoch 2, batch 4572
Training loss: 1.7284249067306519 

Epoch 2, batch 4573
Training loss: 1.8520855903625488 

Epoch 2, batch 4574
Training loss: 1.6768529415130615 

Epoch 2, batch 4575
Training loss: 1.7442559003829956 

Epoch 2, batch 4576
Training loss: 1.6574580669403076 

Epoch 2, batch 4577
Training loss: 1.599797010421753 


Epoch 2, batch 4763
Training loss: 1.5706231594085693 

Epoch 2, batch 4764
Training loss: 1.7670581340789795 

Epoch 2, batch 4765
Training loss: 1.9829773902893066 

Epoch 2, batch 4766
Training loss: 1.7307748794555664 

Epoch 2, batch 4767
Training loss: 1.8133383989334106 

Epoch 2, batch 4768
Training loss: 1.9146515130996704 

Epoch 2, batch 4769
Training loss: 1.8568341732025146 

Epoch 2, batch 4770
Training loss: 1.8682785034179688 

Epoch 2, batch 4771
Training loss: 1.743433952331543 

Epoch 2, batch 4772
Training loss: 1.763509750366211 

Epoch 2, batch 4773
Training loss: 1.7359815835952759 

Epoch 2, batch 4774
Training loss: 1.7021052837371826 

Epoch 2, batch 4775
Training loss: 1.5785305500030518 

Epoch 2, batch 4776
Training loss: 1.746241569519043 

Epoch 2, batch 4777
Training loss: 1.7004084587097168 

Epoch 2, batch 4778
Training loss: 1.6541285514831543 

Epoch 2, batch 4779
Training loss: 2.0205349922180176 

Epoch 2, batch 4780
Training loss: 1.74441266059875

Epoch 2, batch 4963
Training loss: 1.6764605045318604 

Epoch 2, batch 4964
Training loss: 1.755787968635559 

Epoch 2, batch 4965
Training loss: 1.672508955001831 

Epoch 2, batch 4966
Training loss: 1.7219898700714111 

Epoch 2, batch 4967
Training loss: 1.5737836360931396 

Epoch 2, batch 4968
Training loss: 1.9064397811889648 

Epoch 2, batch 4969
Training loss: 1.5013370513916016 

Epoch 2, batch 4970
Training loss: 1.8042469024658203 

Epoch 2, batch 4971
Training loss: 1.8574573993682861 

Epoch 2, batch 4972
Training loss: 1.8381457328796387 

Epoch 2, batch 4973
Training loss: 1.827918291091919 

Epoch 2, batch 4974
Training loss: 1.6651575565338135 

Epoch 2, batch 4975
Training loss: 1.7961888313293457 

Epoch 2, batch 4976
Training loss: 1.7650810480117798 

Epoch 2, batch 4977
Training loss: 1.933574914932251 

Epoch 2, batch 4978
Training loss: 1.8683778047561646 

Epoch 2, batch 4979
Training loss: 1.9467493295669556 

Epoch 2, batch 4980
Training loss: 1.867273330688476

Epoch 2, batch 5165
Training loss: 2.055116653442383 

Epoch 2, batch 5166
Training loss: 1.8093845844268799 

Epoch 2, batch 5167
Training loss: 1.693652629852295 

Epoch 2, batch 5168
Training loss: 1.4934394359588623 

Epoch 2, batch 5169
Training loss: 1.9782977104187012 

Epoch 2, batch 5170
Training loss: 1.6846394538879395 

Epoch 2, batch 5171
Training loss: 2.0244293212890625 

Epoch 2, batch 5172
Training loss: 1.9739539623260498 

Epoch 2, batch 5173
Training loss: 1.669365644454956 

Epoch 2, batch 5174
Training loss: 1.9411633014678955 

Epoch 2, batch 5175
Training loss: 1.7088005542755127 

Epoch 2, batch 5176
Training loss: 1.630785584449768 

Epoch 2, batch 5177
Training loss: 1.7808361053466797 

Epoch 2, batch 5178
Training loss: 1.8336095809936523 

Epoch 2, batch 5179
Training loss: 1.827135682106018 

Epoch 2, batch 5180
Training loss: 1.8819608688354492 

Epoch 2, batch 5181
Training loss: 1.7591297626495361 

Epoch 2, batch 5182
Training loss: 1.5132317543029785

Epoch 2, batch 5367
Training loss: 1.6342079639434814 

Epoch 2, batch 5368
Training loss: 1.5159958600997925 

Epoch 2, batch 5369
Training loss: 1.5569343566894531 

Epoch 2, batch 5370
Training loss: 1.6784945726394653 

Epoch 2, batch 5371
Training loss: 1.7834373712539673 

Epoch 2, batch 5372
Training loss: 2.028230905532837 

Epoch 2, batch 5373
Training loss: 1.9573029279708862 

Epoch 2, batch 5374
Training loss: 1.5812746286392212 

Epoch 2, batch 5375
Training loss: 1.960054874420166 

Epoch 2, batch 5376
Training loss: 1.850317358970642 

Epoch 2, batch 5377
Training loss: 1.6480836868286133 

Epoch 2, batch 5378
Training loss: 1.8433032035827637 

Epoch 2, batch 5379
Training loss: 1.7572298049926758 

Epoch 2, batch 5380
Training loss: 1.7985512018203735 

Epoch 2, batch 5381
Training loss: 1.8095908164978027 

Epoch 2, batch 5382
Training loss: 2.0585391521453857 

Epoch 2, batch 5383
Training loss: 1.769920825958252 

Epoch 2, batch 5384
Training loss: 1.468697428703308

Epoch 2, batch 5567
Training loss: 1.616141676902771 

Epoch 2, batch 5568
Training loss: 1.6279363632202148 

Epoch 2, batch 5569
Training loss: 1.7714664936065674 

Epoch 2, batch 5570
Training loss: 1.8310108184814453 

Epoch 2, batch 5571
Training loss: 1.964571237564087 

Epoch 2, batch 5572
Training loss: 1.8016254901885986 

Epoch 2, batch 5573
Training loss: 1.7052412033081055 

Epoch 2, batch 5574
Training loss: 1.5601222515106201 

Epoch 2, batch 5575
Training loss: 1.5075420141220093 

Epoch 2, batch 5576
Training loss: 1.9218592643737793 

Epoch 2, batch 5577
Training loss: 1.928093433380127 

Epoch 2, batch 5578
Training loss: 1.4972320795059204 

Epoch 2, batch 5579
Training loss: 1.863655686378479 

Epoch 2, batch 5580
Training loss: 2.0623960494995117 

Epoch 2, batch 5581
Training loss: 1.8550302982330322 

Epoch 2, batch 5582
Training loss: 1.612103819847107 

Epoch 2, batch 5583
Training loss: 1.9240731000900269 

Epoch 2, batch 5584
Training loss: 1.5517061948776245

Epoch 2, batch 5768
Training loss: 1.602270483970642 

Epoch 2, batch 5769
Training loss: 1.5725188255310059 

Epoch 2, batch 5770
Training loss: 1.658308506011963 

Epoch 2, batch 5771
Training loss: 1.950596809387207 

Epoch 2, batch 5772
Training loss: 1.8991572856903076 

Epoch 2, batch 5773
Training loss: 1.8036541938781738 

Epoch 2, batch 5774
Training loss: 2.038914203643799 

Epoch 2, batch 5775
Training loss: 1.966641902923584 

Epoch 2, batch 5776
Training loss: 1.9040751457214355 

Epoch 2, batch 5777
Training loss: 1.8803942203521729 

Epoch 2, batch 5778
Training loss: 1.6429953575134277 

Epoch 2, batch 5779
Training loss: 1.9532374143600464 

Epoch 2, batch 5780
Training loss: 1.820723295211792 

Epoch 2, batch 5781
Training loss: 1.5258506536483765 

Epoch 2, batch 5782
Training loss: 1.7285130023956299 

Epoch 2, batch 5783
Training loss: 1.7506134510040283 

Epoch 2, batch 5784
Training loss: 1.6194461584091187 

Epoch 2, batch 5785
Training loss: 1.6776278018951416 

Epoch 2, batch 5970
Training loss: 2.0233445167541504 

Epoch 2, batch 5971
Training loss: 1.8861615657806396 

Epoch 2, batch 5972
Training loss: 1.6852965354919434 

Epoch 2, batch 5973
Training loss: 1.7682340145111084 

Epoch 2, batch 5974
Training loss: 1.7774640321731567 

Epoch 2, batch 5975
Training loss: 1.5596563816070557 

Epoch 2, batch 5976
Training loss: 1.6711647510528564 

Epoch 2, batch 5977
Training loss: 1.6597087383270264 

Epoch 2, batch 5978
Training loss: 1.596774697303772 

Epoch 2, batch 5979
Training loss: 1.7695064544677734 

Epoch 2, batch 5980
Training loss: 1.9010461568832397 

Epoch 2, batch 5981
Training loss: 1.9371187686920166 

Epoch 2, batch 5982
Training loss: 1.6020835638046265 

Epoch 2, batch 5983
Training loss: 1.8936957120895386 

Epoch 2, batch 5984
Training loss: 1.7192003726959229 

Epoch 2, batch 5985
Training loss: 1.925358772277832 

Epoch 2, batch 5986
Training loss: 1.5203378200531006 

Epoch 2, batch 5987
Training loss: 1.7718356847763

Epoch 3, batch 170
Training loss: 1.903620719909668 

Epoch 3, batch 171
Training loss: 1.6027278900146484 

Epoch 3, batch 172
Training loss: 1.9808297157287598 

Epoch 3, batch 173
Training loss: 1.8317359685897827 

Epoch 3, batch 174
Training loss: 1.7019339799880981 

Epoch 3, batch 175
Training loss: 1.5685211420059204 

Epoch 3, batch 176
Training loss: 1.920243740081787 

Epoch 3, batch 177
Training loss: 1.9160230159759521 

Epoch 3, batch 178
Training loss: 1.9552651643753052 

Epoch 3, batch 179
Training loss: 1.574584722518921 

Epoch 3, batch 180
Training loss: 1.8850250244140625 

Epoch 3, batch 181
Training loss: 1.4847750663757324 

Epoch 3, batch 182
Training loss: 1.7053639888763428 

Epoch 3, batch 183
Training loss: 1.6279271841049194 

Epoch 3, batch 184
Training loss: 2.024428367614746 

Epoch 3, batch 185
Training loss: 1.69654381275177 

Epoch 3, batch 186
Training loss: 1.7897183895111084 

Epoch 3, batch 187
Training loss: 1.8157093524932861 

Epoch 3, batch 1

Epoch 3, batch 374
Training loss: 1.6492780447006226 

Epoch 3, batch 375
Training loss: 1.8155102729797363 

Epoch 3, batch 376
Training loss: 1.7764923572540283 

Epoch 3, batch 377
Training loss: 1.4752542972564697 

Epoch 3, batch 378
Training loss: 1.6879022121429443 

Epoch 3, batch 379
Training loss: 1.4751147031784058 

Epoch 3, batch 380
Training loss: 1.9789142608642578 

Epoch 3, batch 381
Training loss: 1.8504365682601929 

Epoch 3, batch 382
Training loss: 1.7461130619049072 

Epoch 3, batch 383
Training loss: 1.5672879219055176 

Epoch 3, batch 384
Training loss: 1.727755069732666 

Epoch 3, batch 385
Training loss: 1.946958065032959 

Epoch 3, batch 386
Training loss: 1.9267443418502808 

Epoch 3, batch 387
Training loss: 1.9025471210479736 

Epoch 3, batch 388
Training loss: 1.6755445003509521 

Epoch 3, batch 389
Training loss: 1.9137954711914062 

Epoch 3, batch 390
Training loss: 1.8892567157745361 

Epoch 3, batch 391
Training loss: 1.99462890625 

Epoch 3, batch 39

Epoch 3, batch 576
Training loss: 1.7714959383010864 

Epoch 3, batch 577
Training loss: 1.6119182109832764 

Epoch 3, batch 578
Training loss: 1.7244741916656494 

Epoch 3, batch 579
Training loss: 1.7750920057296753 

Epoch 3, batch 580
Training loss: 1.5998367071151733 

Epoch 3, batch 581
Training loss: 1.9826246500015259 

Epoch 3, batch 582
Training loss: 1.7593512535095215 

Epoch 3, batch 583
Training loss: 1.6506941318511963 

Epoch 3, batch 584
Training loss: 1.70109224319458 

Epoch 3, batch 585
Training loss: 1.6461182832717896 

Epoch 3, batch 586
Training loss: 1.8228294849395752 

Epoch 3, batch 587
Training loss: 1.6830203533172607 

Epoch 3, batch 588
Training loss: 1.9776089191436768 

Epoch 3, batch 589
Training loss: 1.9980276823043823 

Epoch 3, batch 590
Training loss: 1.6862726211547852 

Epoch 3, batch 591
Training loss: 1.6578738689422607 

Epoch 3, batch 592
Training loss: 1.9482026100158691 

Epoch 3, batch 593
Training loss: 1.8337676525115967 

Epoch 3, bat

Epoch 3, batch 779
Training loss: 1.8359190225601196 

Epoch 3, batch 780
Training loss: 1.7091248035430908 

Epoch 3, batch 781
Training loss: 1.881129264831543 

Epoch 3, batch 782
Training loss: 1.9709089994430542 

Epoch 3, batch 783
Training loss: 1.717413067817688 

Epoch 3, batch 784
Training loss: 1.9900089502334595 

Epoch 3, batch 785
Training loss: 1.5875825881958008 

Epoch 3, batch 786
Training loss: 1.7221800088882446 

Epoch 3, batch 787
Training loss: 1.8628606796264648 

Epoch 3, batch 788
Training loss: 1.5850944519042969 

Epoch 3, batch 789
Training loss: 1.870786190032959 

Epoch 3, batch 790
Training loss: 1.543607473373413 

Epoch 3, batch 791
Training loss: 1.6894922256469727 

Epoch 3, batch 792
Training loss: 1.7221038341522217 

Epoch 3, batch 793
Training loss: 1.628251552581787 

Epoch 3, batch 794
Training loss: 1.8872965574264526 

Epoch 3, batch 795
Training loss: 1.6676771640777588 

Epoch 3, batch 796
Training loss: 1.4926674365997314 

Epoch 3, batch 

Epoch 3, batch 978
Training loss: 1.7808740139007568 

Epoch 3, batch 979
Training loss: 1.5466722249984741 

Epoch 3, batch 980
Training loss: 1.808117151260376 

Epoch 3, batch 981
Training loss: 1.9103600978851318 

Epoch 3, batch 982
Training loss: 1.8106937408447266 

Epoch 3, batch 983
Training loss: 1.6938546895980835 

Epoch 3, batch 984
Training loss: 1.5780497789382935 

Epoch 3, batch 985
Training loss: 1.9001760482788086 

Epoch 3, batch 986
Training loss: 1.504204511642456 

Epoch 3, batch 987
Training loss: 1.6926612854003906 

Epoch 3, batch 988
Training loss: 2.0275425910949707 

Epoch 3, batch 989
Training loss: 1.735835075378418 

Epoch 3, batch 990
Training loss: 1.6325128078460693 

Epoch 3, batch 991
Training loss: 1.6022024154663086 

Epoch 3, batch 992
Training loss: 1.9621295928955078 

Epoch 3, batch 993
Training loss: 2.035090923309326 

Epoch 3, batch 994
Training loss: 1.5858553647994995 

Epoch 3, batch 995
Training loss: 1.4993059635162354 

Epoch 3, batch

Epoch 3, batch 1180
Training loss: 1.6900248527526855 

Epoch 3, batch 1181
Training loss: 1.8982367515563965 

Epoch 3, batch 1182
Training loss: 1.7743351459503174 

Epoch 3, batch 1183
Training loss: 1.7541706562042236 

Epoch 3, batch 1184
Training loss: 1.690889835357666 

Epoch 3, batch 1185
Training loss: 1.6005933284759521 

Epoch 3, batch 1186
Training loss: 1.8582261800765991 

Epoch 3, batch 1187
Training loss: 1.9921772480010986 

Epoch 3, batch 1188
Training loss: 1.6754701137542725 

Epoch 3, batch 1189
Training loss: 1.7018897533416748 

Epoch 3, batch 1190
Training loss: 1.9125770330429077 

Epoch 3, batch 1191
Training loss: 1.6016967296600342 

Epoch 3, batch 1192
Training loss: 1.7215698957443237 

Epoch 3, batch 1193
Training loss: 1.7049400806427002 

Epoch 3, batch 1194
Training loss: 1.6023147106170654 

Epoch 3, batch 1195
Training loss: 1.8427472114562988 

Epoch 3, batch 1196
Training loss: 1.7294220924377441 

Epoch 3, batch 1197
Training loss: 1.693955540657

Epoch 3, batch 1382
Training loss: 1.8846486806869507 

Epoch 3, batch 1383
Training loss: 1.8145776987075806 

Epoch 3, batch 1384
Training loss: 1.978813886642456 

Epoch 3, batch 1385
Training loss: 1.5041253566741943 

Epoch 3, batch 1386
Training loss: 1.7880091667175293 

Epoch 3, batch 1387
Training loss: 1.9051942825317383 

Epoch 3, batch 1388
Training loss: 1.8309118747711182 

Epoch 3, batch 1389
Training loss: 1.6224091053009033 

Epoch 3, batch 1390
Training loss: 1.524009346961975 

Epoch 3, batch 1391
Training loss: 1.502206802368164 

Epoch 3, batch 1392
Training loss: 1.7644717693328857 

Epoch 3, batch 1393
Training loss: 1.646828055381775 

Epoch 3, batch 1394
Training loss: 1.7997779846191406 

Epoch 3, batch 1395
Training loss: 1.612599492073059 

Epoch 3, batch 1396
Training loss: 1.9418361186981201 

Epoch 3, batch 1397
Training loss: 1.718687891960144 

Epoch 3, batch 1398
Training loss: 1.8214110136032104 

Epoch 3, batch 1399
Training loss: 1.6877812147140503 

Epoch 3, batch 1586
Training loss: 1.7764158248901367 

Epoch 3, batch 1587
Training loss: 1.8357664346694946 

Epoch 3, batch 1588
Training loss: 1.5940152406692505 

Epoch 3, batch 1589
Training loss: 1.7221046686172485 

Epoch 3, batch 1590
Training loss: 1.8985629081726074 

Epoch 3, batch 1591
Training loss: 1.787247896194458 

Epoch 3, batch 1592
Training loss: 1.8248913288116455 

Epoch 3, batch 1593
Training loss: 1.6645095348358154 

Epoch 3, batch 1594
Training loss: 1.650981068611145 

Epoch 3, batch 1595
Training loss: 2.0298216342926025 

Epoch 3, batch 1596
Training loss: 1.5595587491989136 

Epoch 3, batch 1597
Training loss: 2.0133094787597656 

Epoch 3, batch 1598
Training loss: 1.5797675848007202 

Epoch 3, batch 1599
Training loss: 1.7403144836425781 

Epoch 3, batch 1600
Training loss: 1.8891289234161377 

Epoch 3, batch 1601
Training loss: 1.758437156677246 

Epoch 3, batch 1602
Training loss: 1.7623815536499023 

Epoch 3, batch 1603
Training loss: 1.61732375621795

Epoch 3, batch 1789
Training loss: 1.6366689205169678 

Epoch 3, batch 1790
Training loss: 1.8935166597366333 

Epoch 3, batch 1791
Training loss: 1.7533135414123535 

Epoch 3, batch 1792
Training loss: 1.9009661674499512 

Epoch 3, batch 1793
Training loss: 1.5735127925872803 

Epoch 3, batch 1794
Training loss: 1.650928258895874 

Epoch 3, batch 1795
Training loss: 1.6655683517456055 

Epoch 3, batch 1796
Training loss: 1.608662486076355 

Epoch 3, batch 1797
Training loss: 1.724290370941162 

Epoch 3, batch 1798
Training loss: 1.752558708190918 

Epoch 3, batch 1799
Training loss: 1.7601211071014404 

Epoch 3, batch 1800
Training loss: 1.5873442888259888 

Epoch 3, batch 1801
Training loss: 1.7791879177093506 

Epoch 3, batch 1802
Training loss: 1.8480507135391235 

Epoch 3, batch 1803
Training loss: 1.6426726579666138 

Epoch 3, batch 1804
Training loss: 2.0332534313201904 

Epoch 3, batch 1805
Training loss: 1.8622560501098633 

Epoch 3, batch 1806
Training loss: 1.799318790435791

Epoch 3, batch 1985
Training loss: 1.836791753768921 

Epoch 3, batch 1986
Training loss: 1.6344130039215088 

Epoch 3, batch 1987
Training loss: 1.7536872625350952 

Epoch 3, batch 1988
Training loss: 1.800641417503357 

Epoch 3, batch 1989
Training loss: 1.6930259466171265 

Epoch 3, batch 1990
Training loss: 1.99546480178833 

Epoch 3, batch 1991
Training loss: 1.8104159832000732 

Epoch 3, batch 1992
Training loss: 1.842612862586975 

Epoch 3, batch 1993
Training loss: 1.6374374628067017 

Epoch 3, batch 1994
Training loss: 2.136171340942383 

Epoch 3, batch 1995
Training loss: 1.7522587776184082 

Epoch 3, batch 1996
Training loss: 1.7823013067245483 

Epoch 3, batch 1997
Training loss: 1.9498631954193115 

Epoch 3, batch 1998
Training loss: 1.670305609703064 

Epoch 3, batch 1999
Training loss: 1.6748526096343994 

Epoch 3, batch 2000
Training loss: 1.5398610830307007 

Epoch 3, batch 2001
Training loss: 1.8432221412658691 

Epoch 3, batch 2002
Training loss: 1.9227681159973145 


Epoch 3, batch 2188
Training loss: 1.6053322553634644 

Epoch 3, batch 2189
Training loss: 1.7441189289093018 

Epoch 3, batch 2190
Training loss: 1.6152950525283813 

Epoch 3, batch 2191
Training loss: 1.8107038736343384 

Epoch 3, batch 2192
Training loss: 1.9207830429077148 

Epoch 3, batch 2193
Training loss: 1.8437459468841553 

Epoch 3, batch 2194
Training loss: 1.7372233867645264 

Epoch 3, batch 2195
Training loss: 1.8153960704803467 

Epoch 3, batch 2196
Training loss: 1.8504940271377563 

Epoch 3, batch 2197
Training loss: 1.6048322916030884 

Epoch 3, batch 2198
Training loss: 1.5062808990478516 

Epoch 3, batch 2199
Training loss: 1.770827054977417 

Epoch 3, batch 2200
Training loss: 1.4805270433425903 

Epoch 3, batch 2201
Training loss: 1.7782106399536133 

Epoch 3, batch 2202
Training loss: 1.4755878448486328 

Epoch 3, batch 2203
Training loss: 1.631839394569397 

Epoch 3, batch 2204
Training loss: 1.7450796365737915 

Epoch 3, batch 2205
Training loss: 1.9389026165008

Epoch 3, batch 2394
Training loss: 1.750770092010498 

Epoch 3, batch 2395
Training loss: 1.9562726020812988 

Epoch 3, batch 2396
Training loss: 1.546658992767334 

Epoch 3, batch 2397
Training loss: 1.778549313545227 

Epoch 3, batch 2398
Training loss: 1.5960983037948608 

Epoch 3, batch 2399
Training loss: 1.9801719188690186 

Epoch 3, batch 2400
Training loss: 1.9118715524673462 

Epoch 3, batch 2401
Training loss: 1.514288067817688 

Epoch 3, batch 2402
Training loss: 1.8242771625518799 

Epoch 3, batch 2403
Training loss: 1.7529486417770386 

Epoch 3, batch 2404
Training loss: 1.6130012273788452 

Epoch 3, batch 2405
Training loss: 1.8090060949325562 

Epoch 3, batch 2406
Training loss: 1.7721271514892578 

Epoch 3, batch 2407
Training loss: 1.8073326349258423 

Epoch 3, batch 2408
Training loss: 1.6366026401519775 

Epoch 3, batch 2409
Training loss: 2.025099992752075 

Epoch 3, batch 2410
Training loss: 1.706923246383667 

Epoch 3, batch 2411
Training loss: 1.9179015159606934 

Epoch 3, batch 2597
Training loss: 1.8495521545410156 

Epoch 3, batch 2598
Training loss: 1.8314242362976074 

Epoch 3, batch 2599
Training loss: 1.7567867040634155 

Epoch 3, batch 2600
Training loss: 1.5788979530334473 

Epoch 3, batch 2601
Training loss: 1.5967618227005005 

Epoch 3, batch 2602
Training loss: 1.615256428718567 

Epoch 3, batch 2603
Training loss: 1.7141573429107666 

Epoch 3, batch 2604
Training loss: 1.8015508651733398 

Epoch 3, batch 2605
Training loss: 1.7765034437179565 

Epoch 3, batch 2606
Training loss: 1.882949709892273 

Epoch 3, batch 2607
Training loss: 2.0124151706695557 

Epoch 3, batch 2608
Training loss: 1.5335021018981934 

Epoch 3, batch 2609
Training loss: 1.9170076847076416 

Epoch 3, batch 2610
Training loss: 1.8361482620239258 

Epoch 3, batch 2611
Training loss: 1.7621852159500122 

Epoch 3, batch 2612
Training loss: 1.6259095668792725 

Epoch 3, batch 2613
Training loss: 1.6339061260223389 

Epoch 3, batch 2614
Training loss: 1.7672758102416

Epoch 3, batch 2801
Training loss: 1.732700228691101 

Epoch 3, batch 2802
Training loss: 1.773507833480835 

Epoch 3, batch 2803
Training loss: 1.801134467124939 

Epoch 3, batch 2804
Training loss: 1.6330255270004272 

Epoch 3, batch 2805
Training loss: 1.9633675813674927 

Epoch 3, batch 2806
Training loss: 1.6663885116577148 

Epoch 3, batch 2807
Training loss: 1.9063894748687744 

Epoch 3, batch 2808
Training loss: 1.8436462879180908 

Epoch 3, batch 2809
Training loss: 1.7145878076553345 

Epoch 3, batch 2810
Training loss: 1.5435258150100708 

Epoch 3, batch 2811
Training loss: 1.652624249458313 

Epoch 3, batch 2812
Training loss: 1.6419941186904907 

Epoch 3, batch 2813
Training loss: 1.7312147617340088 

Epoch 3, batch 2814
Training loss: 1.8629438877105713 

Epoch 3, batch 2815
Training loss: 1.977853775024414 

Epoch 3, batch 2816
Training loss: 1.924170732498169 

Epoch 3, batch 2817
Training loss: 1.812542200088501 

Epoch 3, batch 2818
Training loss: 1.7764408588409424 


Epoch 3, batch 2996
Training loss: 1.5928592681884766 

Epoch 3, batch 2997
Training loss: 1.6741522550582886 

Epoch 3, batch 2998
Training loss: 1.738093614578247 

Epoch 3, batch 2999
Training loss: 1.8485569953918457 

Epoch 3, batch 3000
Training loss: 1.6053773164749146 

Epoch 3, batch 3001
Training loss: 1.7476669549942017 

Epoch 3, batch 3002
Training loss: 2.0661065578460693 

Epoch 3, batch 3003
Training loss: 1.5242440700531006 

Epoch 3, batch 3004
Training loss: 1.6646125316619873 

Epoch 3, batch 3005
Training loss: 1.7395275831222534 

Epoch 3, batch 3006
Training loss: 1.9072283506393433 

Epoch 3, batch 3007
Training loss: 1.8888280391693115 

Epoch 3, batch 3008
Training loss: 1.6587971448898315 

Epoch 3, batch 3009
Training loss: 1.9009697437286377 

Epoch 3, batch 3010
Training loss: 1.6601215600967407 

Epoch 3, batch 3011
Training loss: 1.745131015777588 

Epoch 3, batch 3012
Training loss: 1.619357705116272 

Epoch 3, batch 3013
Training loss: 1.52213406562805

Epoch 3, batch 3196
Training loss: 1.6406652927398682 

Epoch 3, batch 3197
Training loss: 1.5959625244140625 

Epoch 3, batch 3198
Training loss: 1.8727972507476807 

Epoch 3, batch 3199
Training loss: 1.8341972827911377 

Epoch 3, batch 3200
Training loss: 1.7573163509368896 

Epoch 3, batch 3201
Training loss: 1.9099247455596924 

Epoch 3, batch 3202
Training loss: 1.798912763595581 

Epoch 3, batch 3203
Training loss: 1.7612003087997437 

Epoch 3, batch 3204
Training loss: 1.52762770652771 

Epoch 3, batch 3205
Training loss: 1.6918456554412842 

Epoch 3, batch 3206
Training loss: 1.6468925476074219 

Epoch 3, batch 3207
Training loss: 1.7448186874389648 

Epoch 3, batch 3208
Training loss: 1.6197189092636108 

Epoch 3, batch 3209
Training loss: 1.7331485748291016 

Epoch 3, batch 3210
Training loss: 1.5795948505401611 

Epoch 3, batch 3211
Training loss: 1.5371818542480469 

Epoch 3, batch 3212
Training loss: 1.5317707061767578 

Epoch 3, batch 3213
Training loss: 1.62899160385131

Epoch 3, batch 3398
Training loss: 1.8702576160430908 

Epoch 3, batch 3399
Training loss: 1.879249930381775 

Epoch 3, batch 3400
Training loss: 1.553905963897705 

Epoch 3, batch 3401
Training loss: 1.7820446491241455 

Epoch 3, batch 3402
Training loss: 1.8905484676361084 

Epoch 3, batch 3403
Training loss: 1.6795369386672974 

Epoch 3, batch 3404
Training loss: 1.6981627941131592 

Epoch 3, batch 3405
Training loss: 1.7680407762527466 

Epoch 3, batch 3406
Training loss: 1.9018319845199585 

Epoch 3, batch 3407
Training loss: 1.963128924369812 

Epoch 3, batch 3408
Training loss: 1.9514985084533691 

Epoch 3, batch 3409
Training loss: 1.7621345520019531 

Epoch 3, batch 3410
Training loss: 1.7602509260177612 

Epoch 3, batch 3411
Training loss: 1.6629878282546997 

Epoch 3, batch 3412
Training loss: 1.672938346862793 

Epoch 3, batch 3413
Training loss: 1.8454961776733398 

Epoch 3, batch 3414
Training loss: 1.6078888177871704 

Epoch 3, batch 3415
Training loss: 1.707921147346496

Epoch 3, batch 3605
Training loss: 1.5375207662582397 

Epoch 3, batch 3606
Training loss: 1.8613396883010864 

Epoch 3, batch 3607
Training loss: 1.9960343837738037 

Epoch 3, batch 3608
Training loss: 1.7745568752288818 

Epoch 3, batch 3609
Training loss: 1.7321248054504395 

Epoch 3, batch 3610
Training loss: 1.8711585998535156 

Epoch 3, batch 3611
Training loss: 1.4879192113876343 

Epoch 3, batch 3612
Training loss: 1.576167106628418 

Epoch 3, batch 3613
Training loss: 1.9730685949325562 

Epoch 3, batch 3614
Training loss: 1.569846749305725 

Epoch 3, batch 3615
Training loss: 1.5831667184829712 

Epoch 3, batch 3616
Training loss: 1.721184492111206 

Epoch 3, batch 3617
Training loss: 1.7646865844726562 

Epoch 3, batch 3618
Training loss: 1.5337693691253662 

Epoch 3, batch 3619
Training loss: 1.6197271347045898 

Epoch 3, batch 3620
Training loss: 1.827056884765625 

Epoch 3, batch 3621
Training loss: 1.6016794443130493 

Epoch 3, batch 3622
Training loss: 1.746418237686157

Epoch 3, batch 3811
Training loss: 1.558638095855713 

Epoch 3, batch 3812
Training loss: 1.7677321434020996 

Epoch 3, batch 3813
Training loss: 1.6076903343200684 

Epoch 3, batch 3814
Training loss: 1.5869154930114746 

Epoch 3, batch 3815
Training loss: 2.0152602195739746 

Epoch 3, batch 3816
Training loss: 1.68752121925354 

Epoch 3, batch 3817
Training loss: 1.8365964889526367 

Epoch 3, batch 3818
Training loss: 1.9508970975875854 

Epoch 3, batch 3819
Training loss: 1.7946385145187378 

Epoch 3, batch 3820
Training loss: 1.6553179025650024 

Epoch 3, batch 3821
Training loss: 1.725069284439087 

Epoch 3, batch 3822
Training loss: 2.0102057456970215 

Epoch 3, batch 3823
Training loss: 1.970510482788086 

Epoch 3, batch 3824
Training loss: 1.5261307954788208 

Epoch 3, batch 3825
Training loss: 1.8755877017974854 

Epoch 3, batch 3826
Training loss: 2.032954454421997 

Epoch 3, batch 3827
Training loss: 1.8253083229064941 

Epoch 3, batch 3828
Training loss: 1.7921295166015625 

Epoch 3, batch 4017
Training loss: 1.8063929080963135 

Epoch 3, batch 4018
Training loss: 1.6831426620483398 

Epoch 3, batch 4019
Training loss: 1.6070241928100586 

Epoch 3, batch 4020
Training loss: 1.537751317024231 

Epoch 3, batch 4021
Training loss: 1.6013474464416504 

Epoch 3, batch 4022
Training loss: 1.6590536832809448 

Epoch 3, batch 4023
Training loss: 1.8948049545288086 

Epoch 3, batch 4024
Training loss: 1.6677652597427368 

Epoch 3, batch 4025
Training loss: 1.9661295413970947 

Epoch 3, batch 4026
Training loss: 1.9935587644577026 

Epoch 3, batch 4027
Training loss: 1.9027019739151 

Epoch 3, batch 4028
Training loss: 1.885007619857788 

Epoch 3, batch 4029
Training loss: 1.469131588935852 

Epoch 3, batch 4030
Training loss: 1.615370750427246 

Epoch 3, batch 4031
Training loss: 1.5024683475494385 

Epoch 3, batch 4032
Training loss: 1.867779016494751 

Epoch 3, batch 4033
Training loss: 1.9277515411376953 

Epoch 3, batch 4034
Training loss: 1.843399167060852 

E

Epoch 3, batch 4221
Training loss: 1.836472511291504 

Epoch 3, batch 4222
Training loss: 1.6769707202911377 

Epoch 3, batch 4223
Training loss: 1.7731914520263672 

Epoch 3, batch 4224
Training loss: 1.6691310405731201 

Epoch 3, batch 4225
Training loss: 1.6202152967453003 

Epoch 3, batch 4226
Training loss: 1.958390235900879 

Epoch 3, batch 4227
Training loss: 1.6462652683258057 

Epoch 3, batch 4228
Training loss: 1.731855869293213 

Epoch 3, batch 4229
Training loss: 1.6866018772125244 

Epoch 3, batch 4230
Training loss: 1.671912431716919 

Epoch 3, batch 4231
Training loss: 1.7731770277023315 

Epoch 3, batch 4232
Training loss: 1.924821376800537 

Epoch 3, batch 4233
Training loss: 1.8266688585281372 

Epoch 3, batch 4234
Training loss: 1.8676209449768066 

Epoch 3, batch 4235
Training loss: 1.88059663772583 

Epoch 3, batch 4236
Training loss: 1.7904858589172363 

Epoch 3, batch 4237
Training loss: 1.7435917854309082 

Epoch 3, batch 4238
Training loss: 1.49287748336792 

E

Epoch 3, batch 4425
Training loss: 1.8379786014556885 

Epoch 3, batch 4426
Training loss: 1.8928937911987305 

Epoch 3, batch 4427
Training loss: 1.7185232639312744 

Epoch 3, batch 4428
Training loss: 1.8516837358474731 

Epoch 3, batch 4429
Training loss: 2.048977851867676 

Epoch 3, batch 4430
Training loss: 1.6100139617919922 

Epoch 3, batch 4431
Training loss: 1.7956006526947021 

Epoch 3, batch 4432
Training loss: 1.6234116554260254 

Epoch 3, batch 4433
Training loss: 1.6226578950881958 

Epoch 3, batch 4434
Training loss: 1.8851537704467773 

Epoch 3, batch 4435
Training loss: 1.8218035697937012 

Epoch 3, batch 4436
Training loss: 1.9018874168395996 

Epoch 3, batch 4437
Training loss: 1.6238526105880737 

Epoch 3, batch 4438
Training loss: 1.7381930351257324 

Epoch 3, batch 4439
Training loss: 1.9094077348709106 

Epoch 3, batch 4440
Training loss: 1.6584261655807495 

Epoch 3, batch 4441
Training loss: 1.8447734117507935 

Epoch 3, batch 4442
Training loss: 1.588716626167

Epoch 3, batch 4630
Training loss: 1.7121837139129639 

Epoch 3, batch 4631
Training loss: 1.8800619840621948 

Epoch 3, batch 4632
Training loss: 1.806837558746338 

Epoch 3, batch 4633
Training loss: 1.7286243438720703 

Epoch 3, batch 4634
Training loss: 1.9421361684799194 

Epoch 3, batch 4635
Training loss: 1.898903727531433 

Epoch 3, batch 4636
Training loss: 2.0009474754333496 

Epoch 3, batch 4637
Training loss: 1.669508457183838 

Epoch 3, batch 4638
Training loss: 1.6720823049545288 

Epoch 3, batch 4639
Training loss: 1.626917839050293 

Epoch 3, batch 4640
Training loss: 2.163909673690796 

Epoch 3, batch 4641
Training loss: 1.8494278192520142 

Epoch 3, batch 4642
Training loss: 1.667223572731018 

Epoch 3, batch 4643
Training loss: 1.697380542755127 

Epoch 3, batch 4644
Training loss: 1.8523499965667725 

Epoch 3, batch 4645
Training loss: 1.8484777212142944 

Epoch 3, batch 4646
Training loss: 1.6895203590393066 

Epoch 3, batch 4647
Training loss: 1.9349634647369385 


Epoch 3, batch 4835
Training loss: 1.7353148460388184 

Epoch 3, batch 4836
Training loss: 1.5821787118911743 

Epoch 3, batch 4837
Training loss: 1.6296465396881104 

Epoch 3, batch 4838
Training loss: 1.8380544185638428 

Epoch 3, batch 4839
Training loss: 1.6551382541656494 

Epoch 3, batch 4840
Training loss: 1.560934066772461 

Epoch 3, batch 4841
Training loss: 1.7153393030166626 

Epoch 3, batch 4842
Training loss: 1.7951037883758545 

Epoch 3, batch 4843
Training loss: 1.6292282342910767 

Epoch 3, batch 4844
Training loss: 1.6103143692016602 

Epoch 3, batch 4845
Training loss: 1.7498250007629395 

Epoch 3, batch 4846
Training loss: 1.7457425594329834 

Epoch 3, batch 4847
Training loss: 1.8144819736480713 

Epoch 3, batch 4848
Training loss: 1.7107460498809814 

Epoch 3, batch 4849
Training loss: 1.8967407941818237 

Epoch 3, batch 4850
Training loss: 1.8043549060821533 

Epoch 3, batch 4851
Training loss: 1.8571852445602417 

Epoch 3, batch 4852
Training loss: 1.538761854171

Epoch 3, batch 5037
Training loss: 1.7348620891571045 

Epoch 3, batch 5038
Training loss: 1.5950169563293457 

Epoch 3, batch 5039
Training loss: 1.6080187559127808 

Epoch 3, batch 5040
Training loss: 1.7625269889831543 

Epoch 3, batch 5041
Training loss: 1.6422017812728882 

Epoch 3, batch 5042
Training loss: 1.7548036575317383 

Epoch 3, batch 5043
Training loss: 1.8118358850479126 

Epoch 3, batch 5044
Training loss: 1.7645902633666992 

Epoch 3, batch 5045
Training loss: 1.8982752561569214 

Epoch 3, batch 5046
Training loss: 1.6566767692565918 

Epoch 3, batch 5047
Training loss: 1.5329302549362183 

Epoch 3, batch 5048
Training loss: 1.9583470821380615 

Epoch 3, batch 5049
Training loss: 1.865617036819458 

Epoch 3, batch 5050
Training loss: 1.6549005508422852 

Epoch 3, batch 5051
Training loss: 1.8919634819030762 

Epoch 3, batch 5052
Training loss: 1.6411973237991333 

Epoch 3, batch 5053
Training loss: 1.6432714462280273 

Epoch 3, batch 5054
Training loss: 1.514598965644

Epoch 3, batch 5240
Training loss: 1.786369800567627 

Epoch 3, batch 5241
Training loss: 1.65220308303833 

Epoch 3, batch 5242
Training loss: 1.6385986804962158 

Epoch 3, batch 5243
Training loss: 1.8887419700622559 

Epoch 3, batch 5244
Training loss: 1.8318777084350586 

Epoch 3, batch 5245
Training loss: 1.6091837882995605 

Epoch 3, batch 5246
Training loss: 1.5213977098464966 

Epoch 3, batch 5247
Training loss: 1.911374568939209 

Epoch 3, batch 5248
Training loss: 1.5243592262268066 

Epoch 3, batch 5249
Training loss: 1.7676708698272705 

Epoch 3, batch 5250
Training loss: 1.5710229873657227 

Epoch 3, batch 5251
Training loss: 1.7451019287109375 

Epoch 3, batch 5252
Training loss: 1.8574161529541016 

Epoch 3, batch 5253
Training loss: 1.8190953731536865 

Epoch 3, batch 5254
Training loss: 1.7740211486816406 

Epoch 3, batch 5255
Training loss: 1.7653088569641113 

Epoch 3, batch 5256
Training loss: 1.6127228736877441 

Epoch 3, batch 5257
Training loss: 1.806300163269043

Epoch 3, batch 5446
Training loss: 1.5983479022979736 

Epoch 3, batch 5447
Training loss: 1.9156687259674072 

Epoch 3, batch 5448
Training loss: 1.5520823001861572 

Epoch 3, batch 5449
Training loss: 1.9583195447921753 

Epoch 3, batch 5450
Training loss: 1.8235344886779785 

Epoch 3, batch 5451
Training loss: 1.791905403137207 

Epoch 3, batch 5452
Training loss: 1.6211329698562622 

Epoch 3, batch 5453
Training loss: 1.896996259689331 

Epoch 3, batch 5454
Training loss: 1.7454335689544678 

Epoch 3, batch 5455
Training loss: 1.7679460048675537 

Epoch 3, batch 5456
Training loss: 1.8512672185897827 

Epoch 3, batch 5457
Training loss: 2.0504603385925293 

Epoch 3, batch 5458
Training loss: 1.6066702604293823 

Epoch 3, batch 5459
Training loss: 1.7263554334640503 

Epoch 3, batch 5460
Training loss: 1.6657224893569946 

Epoch 3, batch 5461
Training loss: 1.669467806816101 

Epoch 3, batch 5462
Training loss: 1.8009705543518066 

Epoch 3, batch 5463
Training loss: 1.76768064498901

Epoch 3, batch 5651
Training loss: 1.9099643230438232 

Epoch 3, batch 5652
Training loss: 1.810402512550354 

Epoch 3, batch 5653
Training loss: 2.0821151733398438 

Epoch 3, batch 5654
Training loss: 1.7425596714019775 

Epoch 3, batch 5655
Training loss: 1.7976114749908447 

Epoch 3, batch 5656
Training loss: 1.5741844177246094 

Epoch 3, batch 5657
Training loss: 1.6409380435943604 

Epoch 3, batch 5658
Training loss: 1.9211556911468506 

Epoch 3, batch 5659
Training loss: 1.89402174949646 

Epoch 3, batch 5660
Training loss: 1.7894024848937988 

Epoch 3, batch 5661
Training loss: 1.7968223094940186 

Epoch 3, batch 5662
Training loss: 1.9991014003753662 

Epoch 3, batch 5663
Training loss: 1.7196714878082275 

Epoch 3, batch 5664
Training loss: 1.7883758544921875 

Epoch 3, batch 5665
Training loss: 1.665457010269165 

Epoch 3, batch 5666
Training loss: 1.7412700653076172 

Epoch 3, batch 5667
Training loss: 1.846127986907959 

Epoch 3, batch 5668
Training loss: 1.7942736148834229

Epoch 3, batch 5855
Training loss: 1.9824209213256836 

Epoch 3, batch 5856
Training loss: 1.6293580532073975 

Epoch 3, batch 5857
Training loss: 1.6614813804626465 

Epoch 3, batch 5858
Training loss: 1.7692279815673828 

Epoch 3, batch 5859
Training loss: 1.473933458328247 

Epoch 3, batch 5860
Training loss: 1.6010706424713135 

Epoch 3, batch 5861
Training loss: 1.827762246131897 

Epoch 3, batch 5862
Training loss: 1.7252053022384644 

Epoch 3, batch 5863
Training loss: 1.5679471492767334 

Epoch 3, batch 5864
Training loss: 1.883357286453247 

Epoch 3, batch 5865
Training loss: 1.83676278591156 

Epoch 3, batch 5866
Training loss: 1.6215405464172363 

Epoch 3, batch 5867
Training loss: 2.000138282775879 

Epoch 3, batch 5868
Training loss: 1.617087483406067 

Epoch 3, batch 5869
Training loss: 1.893503189086914 

Epoch 3, batch 5870
Training loss: 1.6931672096252441 

Epoch 3, batch 5871
Training loss: 1.7978622913360596 

Epoch 3, batch 5872
Training loss: 1.907832384109497 

E

Epoch 4, batch 56
Training loss: 1.521342158317566 

Epoch 4, batch 57
Training loss: 1.5710506439208984 

Epoch 4, batch 58
Training loss: 1.7806035280227661 

Epoch 4, batch 59
Training loss: 1.7261521816253662 

Epoch 4, batch 60
Training loss: 1.5408788919448853 

Epoch 4, batch 61
Training loss: 1.9519433975219727 

Epoch 4, batch 62
Training loss: 1.8208516836166382 

Epoch 4, batch 63
Training loss: 1.951812744140625 

Epoch 4, batch 64
Training loss: 1.9007577896118164 

Epoch 4, batch 65
Training loss: 1.8086003065109253 

Epoch 4, batch 66
Training loss: 1.9430065155029297 

Epoch 4, batch 67
Training loss: 1.8409423828125 

Epoch 4, batch 68
Training loss: 1.6024847030639648 

Epoch 4, batch 69
Training loss: 1.7586686611175537 

Epoch 4, batch 70
Training loss: 1.982564926147461 

Epoch 4, batch 71
Training loss: 1.495441198348999 

Epoch 4, batch 72
Training loss: 1.5710575580596924 

Epoch 4, batch 73
Training loss: 1.6834052801132202 

Epoch 4, batch 74
Training loss: 1.

Epoch 4, batch 256
Training loss: 1.7723997831344604 

Epoch 4, batch 257
Training loss: 1.5428190231323242 

Epoch 4, batch 258
Training loss: 1.6952202320098877 

Epoch 4, batch 259
Training loss: 1.6902421712875366 

Epoch 4, batch 260
Training loss: 1.84669029712677 

Epoch 4, batch 261
Training loss: 1.514149785041809 

Epoch 4, batch 262
Training loss: 1.752720832824707 

Epoch 4, batch 263
Training loss: 1.7928767204284668 

Epoch 4, batch 264
Training loss: 1.715803861618042 

Epoch 4, batch 265
Training loss: 1.6871867179870605 

Epoch 4, batch 266
Training loss: 1.533812403678894 

Epoch 4, batch 267
Training loss: 1.6232484579086304 

Epoch 4, batch 268
Training loss: 1.7268356084823608 

Epoch 4, batch 269
Training loss: 1.514929175376892 

Epoch 4, batch 270
Training loss: 1.790939211845398 

Epoch 4, batch 271
Training loss: 1.8502001762390137 

Epoch 4, batch 272
Training loss: 1.8443801403045654 

Epoch 4, batch 273
Training loss: 1.8703575134277344 

Epoch 4, batch 274

Epoch 4, batch 460
Training loss: 1.9532830715179443 

Epoch 4, batch 461
Training loss: 1.997110366821289 

Epoch 4, batch 462
Training loss: 1.5517001152038574 

Epoch 4, batch 463
Training loss: 1.7999120950698853 

Epoch 4, batch 464
Training loss: 1.9510462284088135 

Epoch 4, batch 465
Training loss: 1.7512794733047485 

Epoch 4, batch 466
Training loss: 1.558435082435608 

Epoch 4, batch 467
Training loss: 1.7262191772460938 

Epoch 4, batch 468
Training loss: 1.627055048942566 

Epoch 4, batch 469
Training loss: 1.6600450277328491 

Epoch 4, batch 470
Training loss: 1.7106997966766357 

Epoch 4, batch 471
Training loss: 1.8510539531707764 

Epoch 4, batch 472
Training loss: 1.6706740856170654 

Epoch 4, batch 473
Training loss: 1.909888744354248 

Epoch 4, batch 474
Training loss: 1.8893203735351562 

Epoch 4, batch 475
Training loss: 1.6302568912506104 

Epoch 4, batch 476
Training loss: 1.6590373516082764 

Epoch 4, batch 477
Training loss: 1.717317819595337 

Epoch 4, batch 

Epoch 4, batch 664
Training loss: 1.8258476257324219 

Epoch 4, batch 665
Training loss: 1.8523106575012207 

Epoch 4, batch 666
Training loss: 1.4757399559020996 

Epoch 4, batch 667
Training loss: 1.5697146654129028 

Epoch 4, batch 668
Training loss: 1.88966965675354 

Epoch 4, batch 669
Training loss: 1.7305560111999512 

Epoch 4, batch 670
Training loss: 1.6083306074142456 

Epoch 4, batch 671
Training loss: 1.697394847869873 

Epoch 4, batch 672
Training loss: 2.0334270000457764 

Epoch 4, batch 673
Training loss: 1.7419884204864502 

Epoch 4, batch 674
Training loss: 1.6416242122650146 

Epoch 4, batch 675
Training loss: 1.8272063732147217 

Epoch 4, batch 676
Training loss: 1.5828486680984497 

Epoch 4, batch 677
Training loss: 1.596427083015442 

Epoch 4, batch 678
Training loss: 1.6360610723495483 

Epoch 4, batch 679
Training loss: 1.6333131790161133 

Epoch 4, batch 680
Training loss: 1.730900526046753 

Epoch 4, batch 681
Training loss: 1.8601741790771484 

Epoch 4, batch 

Epoch 4, batch 866
Training loss: 1.5008599758148193 

Epoch 4, batch 867
Training loss: 1.9263761043548584 

Epoch 4, batch 868
Training loss: 1.8126099109649658 

Epoch 4, batch 869
Training loss: 1.7604165077209473 

Epoch 4, batch 870
Training loss: 1.9950419664382935 

Epoch 4, batch 871
Training loss: 1.7891634702682495 

Epoch 4, batch 872
Training loss: 1.5686898231506348 

Epoch 4, batch 873
Training loss: 1.7896852493286133 

Epoch 4, batch 874
Training loss: 1.7042315006256104 

Epoch 4, batch 875
Training loss: 1.808525562286377 

Epoch 4, batch 876
Training loss: 1.811204433441162 

Epoch 4, batch 877
Training loss: 1.6525566577911377 

Epoch 4, batch 878
Training loss: 1.871100902557373 

Epoch 4, batch 879
Training loss: 1.9362419843673706 

Epoch 4, batch 880
Training loss: 1.6435401439666748 

Epoch 4, batch 881
Training loss: 1.9929814338684082 

Epoch 4, batch 882
Training loss: 1.9277913570404053 

Epoch 4, batch 883
Training loss: 1.8872084617614746 

Epoch 4, batc

Epoch 4, batch 1066
Training loss: 1.4949394464492798 

Epoch 4, batch 1067
Training loss: 1.592545986175537 

Epoch 4, batch 1068
Training loss: 1.8370940685272217 

Epoch 4, batch 1069
Training loss: 1.80381178855896 

Epoch 4, batch 1070
Training loss: 1.6726046800613403 

Epoch 4, batch 1071
Training loss: 1.9464666843414307 

Epoch 4, batch 1072
Training loss: 1.860458254814148 

Epoch 4, batch 1073
Training loss: 1.824753761291504 

Epoch 4, batch 1074
Training loss: 1.8117940425872803 

Epoch 4, batch 1075
Training loss: 1.8461991548538208 

Epoch 4, batch 1076
Training loss: 1.6907143592834473 

Epoch 4, batch 1077
Training loss: 1.63480544090271 

Epoch 4, batch 1078
Training loss: 1.8884878158569336 

Epoch 4, batch 1079
Training loss: 1.7620651721954346 

Epoch 4, batch 1080
Training loss: 1.574552297592163 

Epoch 4, batch 1081
Training loss: 2.0262887477874756 

Epoch 4, batch 1082
Training loss: 1.5912654399871826 

Epoch 4, batch 1083
Training loss: 1.9279675483703613 



Epoch 4, batch 1268
Training loss: 1.5979273319244385 

Epoch 4, batch 1269
Training loss: 1.9551925659179688 

Epoch 4, batch 1270
Training loss: 1.6972137689590454 

Epoch 4, batch 1271
Training loss: 1.7845714092254639 

Epoch 4, batch 1272
Training loss: 1.877782940864563 

Epoch 4, batch 1273
Training loss: 1.6039777994155884 

Epoch 4, batch 1274
Training loss: 1.6777541637420654 

Epoch 4, batch 1275
Training loss: 1.716338872909546 

Epoch 4, batch 1276
Training loss: 1.7533801794052124 

Epoch 4, batch 1277
Training loss: 1.5117545127868652 

Epoch 4, batch 1278
Training loss: 1.607300043106079 

Epoch 4, batch 1279
Training loss: 1.6533598899841309 

Epoch 4, batch 1280
Training loss: 1.732187271118164 

Epoch 4, batch 1281
Training loss: 2.0066871643066406 

Epoch 4, batch 1282
Training loss: 1.9207981824874878 

Epoch 4, batch 1283
Training loss: 1.5742650032043457 

Epoch 4, batch 1284
Training loss: 1.6372631788253784 

Epoch 4, batch 1285
Training loss: 1.829452276229858

Epoch 4, batch 1470
Training loss: 1.6704597473144531 

Epoch 4, batch 1471
Training loss: 1.8052012920379639 

Epoch 4, batch 1472
Training loss: 1.7014943361282349 

Epoch 4, batch 1473
Training loss: 1.8368849754333496 

Epoch 4, batch 1474
Training loss: 1.5263513326644897 

Epoch 4, batch 1475
Training loss: 1.8603326082229614 

Epoch 4, batch 1476
Training loss: 1.8476285934448242 

Epoch 4, batch 1477
Training loss: 1.5469025373458862 

Epoch 4, batch 1478
Training loss: 1.6573376655578613 

Epoch 4, batch 1479
Training loss: 1.8858860731124878 

Epoch 4, batch 1480
Training loss: 1.8032324314117432 

Epoch 4, batch 1481
Training loss: 1.8999853134155273 

Epoch 4, batch 1482
Training loss: 1.7264330387115479 

Epoch 4, batch 1483
Training loss: 1.6845612525939941 

Epoch 4, batch 1484
Training loss: 1.5692906379699707 

Epoch 4, batch 1485
Training loss: 1.809736967086792 

Epoch 4, batch 1486
Training loss: 1.5821046829223633 

Epoch 4, batch 1487
Training loss: 1.924988031387

Epoch 4, batch 1667
Training loss: 1.6368885040283203 

Epoch 4, batch 1668
Training loss: 1.7361881732940674 

Epoch 4, batch 1669
Training loss: 1.7943248748779297 

Epoch 4, batch 1670
Training loss: 1.784717082977295 

Epoch 4, batch 1671
Training loss: 1.9579250812530518 

Epoch 4, batch 1672
Training loss: 1.5342484712600708 

Epoch 4, batch 1673
Training loss: 1.6059753894805908 

Epoch 4, batch 1674
Training loss: 2.019766330718994 

Epoch 4, batch 1675
Training loss: 1.6327710151672363 

Epoch 4, batch 1676
Training loss: 1.9780149459838867 

Epoch 4, batch 1677
Training loss: 1.9304299354553223 

Epoch 4, batch 1678
Training loss: 1.5962417125701904 

Epoch 4, batch 1679
Training loss: 1.6940207481384277 

Epoch 4, batch 1680
Training loss: 1.8347184658050537 

Epoch 4, batch 1681
Training loss: 1.780442714691162 

Epoch 4, batch 1682
Training loss: 1.6430115699768066 

Epoch 4, batch 1683
Training loss: 1.981596827507019 

Epoch 4, batch 1684
Training loss: 1.609841823577880

Epoch 4, batch 1871
Training loss: 2.0267646312713623 

Epoch 4, batch 1872
Training loss: 1.6548240184783936 

Epoch 4, batch 1873
Training loss: 1.7904584407806396 

Epoch 4, batch 1874
Training loss: 1.5332176685333252 

Epoch 4, batch 1875
Training loss: 1.8093496561050415 

Epoch 4, batch 1876
Training loss: 1.469542384147644 

Epoch 4, batch 1877
Training loss: 1.8960018157958984 

Epoch 4, batch 1878
Training loss: 1.6270952224731445 

Epoch 4, batch 1879
Training loss: 1.6012632846832275 

Epoch 4, batch 1880
Training loss: 1.6203914880752563 

Epoch 4, batch 1881
Training loss: 1.753659725189209 

Epoch 4, batch 1882
Training loss: 1.964881420135498 

Epoch 4, batch 1883
Training loss: 1.9330185651779175 

Epoch 4, batch 1884
Training loss: 1.9202628135681152 

Epoch 4, batch 1885
Training loss: 1.9172536134719849 

Epoch 4, batch 1886
Training loss: 1.9574878215789795 

Epoch 4, batch 1887
Training loss: 1.7257076501846313 

Epoch 4, batch 1888
Training loss: 1.96897494792938

Epoch 4, batch 2073
Training loss: 1.8610680103302002 

Epoch 4, batch 2074
Training loss: 1.788104772567749 

Epoch 4, batch 2075
Training loss: 1.8837404251098633 

Epoch 4, batch 2076
Training loss: 1.8303742408752441 

Epoch 4, batch 2077
Training loss: 1.959579586982727 

Epoch 4, batch 2078
Training loss: 1.7557039260864258 

Epoch 4, batch 2079
Training loss: 1.5936412811279297 

Epoch 4, batch 2080
Training loss: 1.7350542545318604 

Epoch 4, batch 2081
Training loss: 1.6862698793411255 

Epoch 4, batch 2082
Training loss: 1.7737798690795898 

Epoch 4, batch 2083
Training loss: 1.6022861003875732 

Epoch 4, batch 2084
Training loss: 1.6789323091506958 

Epoch 4, batch 2085
Training loss: 1.6489332914352417 

Epoch 4, batch 2086
Training loss: 1.6512006521224976 

Epoch 4, batch 2087
Training loss: 1.5757709741592407 

Epoch 4, batch 2088
Training loss: 1.802997350692749 

Epoch 4, batch 2089
Training loss: 1.8138878345489502 

Epoch 4, batch 2090
Training loss: 1.56044459342956

Epoch 4, batch 2265
Training loss: 1.5646300315856934 

Epoch 4, batch 2266
Training loss: 1.4983934164047241 

Epoch 4, batch 2267
Training loss: 1.6777836084365845 

Epoch 4, batch 2268
Training loss: 1.7229591608047485 

Epoch 4, batch 2269
Training loss: 1.5814462900161743 

Epoch 4, batch 2270
Training loss: 1.862851619720459 

Epoch 4, batch 2271
Training loss: 1.8169289827346802 

Epoch 4, batch 2272
Training loss: 1.5468796491622925 

Epoch 4, batch 2273
Training loss: 1.8893336057662964 

Epoch 4, batch 2274
Training loss: 1.5481503009796143 

Epoch 4, batch 2275
Training loss: 1.6490885019302368 

Epoch 4, batch 2276
Training loss: 1.8802584409713745 

Epoch 4, batch 2277
Training loss: 1.8956407308578491 

Epoch 4, batch 2278
Training loss: 1.7734596729278564 

Epoch 4, batch 2279
Training loss: 2.051034688949585 

Epoch 4, batch 2280
Training loss: 1.717699408531189 

Epoch 4, batch 2281
Training loss: 1.9361252784729004 

Epoch 4, batch 2282
Training loss: 1.73993134498596

Epoch 4, batch 2463
Training loss: 1.5617867708206177 

Epoch 4, batch 2464
Training loss: 1.7275075912475586 

Epoch 4, batch 2465
Training loss: 1.7529780864715576 

Epoch 4, batch 2466
Training loss: 1.8031977415084839 

Epoch 4, batch 2467
Training loss: 1.6700215339660645 

Epoch 4, batch 2468
Training loss: 1.8346319198608398 

Epoch 4, batch 2469
Training loss: 1.5959577560424805 

Epoch 4, batch 2470
Training loss: 1.7155290842056274 

Epoch 4, batch 2471
Training loss: 1.8025044202804565 

Epoch 4, batch 2472
Training loss: 1.8940365314483643 

Epoch 4, batch 2473
Training loss: 1.529280424118042 

Epoch 4, batch 2474
Training loss: 1.6273747682571411 

Epoch 4, batch 2475
Training loss: 1.7977182865142822 

Epoch 4, batch 2476
Training loss: 1.7579222917556763 

Epoch 4, batch 2477
Training loss: 1.7735651731491089 

Epoch 4, batch 2478
Training loss: 1.7798736095428467 

Epoch 4, batch 2479
Training loss: 1.6474990844726562 

Epoch 4, batch 2480
Training loss: 1.728979825973

Epoch 4, batch 2666
Training loss: 1.6243771314620972 

Epoch 4, batch 2667
Training loss: 1.8270721435546875 

Epoch 4, batch 2668
Training loss: 1.531569004058838 

Epoch 4, batch 2669
Training loss: 2.057183265686035 

Epoch 4, batch 2670
Training loss: 1.5377787351608276 

Epoch 4, batch 2671
Training loss: 1.5507704019546509 

Epoch 4, batch 2672
Training loss: 1.8997926712036133 

Epoch 4, batch 2673
Training loss: 1.8024203777313232 

Epoch 4, batch 2674
Training loss: 1.6179606914520264 

Epoch 4, batch 2675
Training loss: 1.5959511995315552 

Epoch 4, batch 2676
Training loss: 1.8035297393798828 

Epoch 4, batch 2677
Training loss: 1.936295986175537 

Epoch 4, batch 2678
Training loss: 1.5821837186813354 

Epoch 4, batch 2679
Training loss: 1.7097581624984741 

Epoch 4, batch 2680
Training loss: 1.8180402517318726 

Epoch 4, batch 2681
Training loss: 1.8623108863830566 

Epoch 4, batch 2682
Training loss: 1.7047171592712402 

Epoch 4, batch 2683
Training loss: 1.81332445144653

Epoch 4, batch 2868
Training loss: 1.5641905069351196 

Epoch 4, batch 2869
Training loss: 1.6283354759216309 

Epoch 4, batch 2870
Training loss: 1.9169609546661377 

Epoch 4, batch 2871
Training loss: 1.4918286800384521 

Epoch 4, batch 2872
Training loss: 1.8935892581939697 

Epoch 4, batch 2873
Training loss: 1.4676494598388672 

Epoch 4, batch 2874
Training loss: 1.5081913471221924 

Epoch 4, batch 2875
Training loss: 1.6197279691696167 

Epoch 4, batch 2876
Training loss: 1.714584469795227 

Epoch 4, batch 2877
Training loss: 1.7385756969451904 

Epoch 4, batch 2878
Training loss: 1.9178204536437988 

Epoch 4, batch 2879
Training loss: 1.87344229221344 

Epoch 4, batch 2880
Training loss: 1.7456762790679932 

Epoch 4, batch 2881
Training loss: 1.4959286451339722 

Epoch 4, batch 2882
Training loss: 1.7947945594787598 

Epoch 4, batch 2883
Training loss: 1.5438824892044067 

Epoch 4, batch 2884
Training loss: 2.023723602294922 

Epoch 4, batch 2885
Training loss: 1.759225726127624

Epoch 4, batch 3066
Training loss: 1.6086828708648682 

Epoch 4, batch 3067
Training loss: 1.8631930351257324 

Epoch 4, batch 3068
Training loss: 1.7190805673599243 

Epoch 4, batch 3069
Training loss: 1.9540855884552002 

Epoch 4, batch 3070
Training loss: 1.4843226671218872 

Epoch 4, batch 3071
Training loss: 1.656902551651001 

Epoch 4, batch 3072
Training loss: 1.5946041345596313 

Epoch 4, batch 3073
Training loss: 1.7987945079803467 

Epoch 4, batch 3074
Training loss: 1.8819797039031982 

Epoch 4, batch 3075
Training loss: 1.6752207279205322 

Epoch 4, batch 3076
Training loss: 1.9523907899856567 

Epoch 4, batch 3077
Training loss: 1.9666903018951416 

Epoch 4, batch 3078
Training loss: 1.5124588012695312 

Epoch 4, batch 3079
Training loss: 1.796471357345581 

Epoch 4, batch 3080
Training loss: 1.893911600112915 

Epoch 4, batch 3081
Training loss: 1.5291802883148193 

Epoch 4, batch 3082
Training loss: 1.5159488916397095 

Epoch 4, batch 3083
Training loss: 1.88626396656036

Epoch 4, batch 3269
Training loss: 1.640582799911499 

Epoch 4, batch 3270
Training loss: 1.6788884401321411 

Epoch 4, batch 3271
Training loss: 1.9063785076141357 

Epoch 4, batch 3272
Training loss: 1.5614817142486572 

Epoch 4, batch 3273
Training loss: 1.8234403133392334 

Epoch 4, batch 3274
Training loss: 1.5962085723876953 

Epoch 4, batch 3275
Training loss: 1.8952293395996094 

Epoch 4, batch 3276
Training loss: 1.7704846858978271 

Epoch 4, batch 3277
Training loss: 1.7500677108764648 

Epoch 4, batch 3278
Training loss: 1.9222838878631592 

Epoch 4, batch 3279
Training loss: 1.9383577108383179 

Epoch 4, batch 3280
Training loss: 1.7499037981033325 

Epoch 4, batch 3281
Training loss: 1.6395492553710938 

Epoch 4, batch 3282
Training loss: 1.512644648551941 

Epoch 4, batch 3283
Training loss: 1.6144713163375854 

Epoch 4, batch 3284
Training loss: 1.5783145427703857 

Epoch 4, batch 3285
Training loss: 1.5735375881195068 

Epoch 4, batch 3286
Training loss: 1.9270081520080

Epoch 4, batch 3471
Training loss: 1.6263582706451416 

Epoch 4, batch 3472
Training loss: 1.7439842224121094 

Epoch 4, batch 3473
Training loss: 1.5234270095825195 

Epoch 4, batch 3474
Training loss: 1.569008231163025 

Epoch 4, batch 3475
Training loss: 1.666643500328064 

Epoch 4, batch 3476
Training loss: 1.9931166172027588 

Epoch 4, batch 3477
Training loss: 1.9936723709106445 

Epoch 4, batch 3478
Training loss: 1.5982685089111328 

Epoch 4, batch 3479
Training loss: 2.011495351791382 

Epoch 4, batch 3480
Training loss: 1.8033156394958496 

Epoch 4, batch 3481
Training loss: 1.7111492156982422 

Epoch 4, batch 3482
Training loss: 1.834822416305542 

Epoch 4, batch 3483
Training loss: 1.8098968267440796 

Epoch 4, batch 3484
Training loss: 1.9714261293411255 

Epoch 4, batch 3485
Training loss: 1.7545946836471558 

Epoch 4, batch 3486
Training loss: 1.7161284685134888 

Epoch 4, batch 3487
Training loss: 1.8426589965820312 

Epoch 4, batch 3488
Training loss: 1.981791973114013

Epoch 4, batch 3675
Training loss: 1.9197001457214355 

Epoch 4, batch 3676
Training loss: 1.6970999240875244 

Epoch 4, batch 3677
Training loss: 1.65239679813385 

Epoch 4, batch 3678
Training loss: 1.8684964179992676 

Epoch 4, batch 3679
Training loss: 1.9060890674591064 

Epoch 4, batch 3680
Training loss: 1.8057713508605957 

Epoch 4, batch 3681
Training loss: 1.9887800216674805 

Epoch 4, batch 3682
Training loss: 1.9813921451568604 

Epoch 4, batch 3683
Training loss: 1.6205573081970215 

Epoch 4, batch 3684
Training loss: 2.0057621002197266 

Epoch 4, batch 3685
Training loss: 1.7608041763305664 

Epoch 4, batch 3686
Training loss: 1.7371015548706055 

Epoch 4, batch 3687
Training loss: 1.8694024085998535 

Epoch 4, batch 3688
Training loss: 2.098788022994995 

Epoch 4, batch 3689
Training loss: 1.7659966945648193 

Epoch 4, batch 3690
Training loss: 1.5626717805862427 

Epoch 4, batch 3691
Training loss: 2.039220094680786 

Epoch 4, batch 3692
Training loss: 1.736592054367065

Epoch 4, batch 3878
Training loss: 1.6064788103103638 

Epoch 4, batch 3879
Training loss: 1.822847843170166 

Epoch 4, batch 3880
Training loss: 1.6112724542617798 

Epoch 4, batch 3881
Training loss: 1.744659423828125 

Epoch 4, batch 3882
Training loss: 1.9967694282531738 

Epoch 4, batch 3883
Training loss: 1.5446970462799072 

Epoch 4, batch 3884
Training loss: 1.5118221044540405 

Epoch 4, batch 3885
Training loss: 1.6033138036727905 

Epoch 4, batch 3886
Training loss: 1.5308588743209839 

Epoch 4, batch 3887
Training loss: 1.8166381120681763 

Epoch 4, batch 3888
Training loss: 1.5480623245239258 

Epoch 4, batch 3889
Training loss: 1.810121774673462 

Epoch 4, batch 3890
Training loss: 1.8677154779434204 

Epoch 4, batch 3891
Training loss: 1.5019725561141968 

Epoch 4, batch 3892
Training loss: 1.764589548110962 

Epoch 4, batch 3893
Training loss: 1.9034347534179688 

Epoch 4, batch 3894
Training loss: 1.8463521003723145 

Epoch 4, batch 3895
Training loss: 1.732349157333374

Epoch 4, batch 4077
Training loss: 1.8795311450958252 

Epoch 4, batch 4078
Training loss: 1.7249641418457031 

Epoch 4, batch 4079
Training loss: 1.8893074989318848 

Epoch 4, batch 4080
Training loss: 1.5151844024658203 

Epoch 4, batch 4081
Training loss: 1.4999027252197266 

Epoch 4, batch 4082
Training loss: 1.8478628396987915 

Epoch 4, batch 4083
Training loss: 1.7331368923187256 

Epoch 4, batch 4084
Training loss: 1.614700198173523 

Epoch 4, batch 4085
Training loss: 1.8474645614624023 

Epoch 4, batch 4086
Training loss: 1.9139803647994995 

Epoch 4, batch 4087
Training loss: 1.7828483581542969 

Epoch 4, batch 4088
Training loss: 1.9612427949905396 

Epoch 4, batch 4089
Training loss: 1.5749497413635254 

Epoch 4, batch 4090
Training loss: 1.513905644416809 

Epoch 4, batch 4091
Training loss: 1.676304817199707 

Epoch 4, batch 4092
Training loss: 1.7755203247070312 

Epoch 4, batch 4093
Training loss: 1.904745101928711 

Epoch 4, batch 4094
Training loss: 1.553639888763427

Epoch 4, batch 4280
Training loss: 1.709494709968567 

Epoch 4, batch 4281
Training loss: 1.80002760887146 

Epoch 4, batch 4282
Training loss: 1.7415871620178223 

Epoch 4, batch 4283
Training loss: 1.9420087337493896 

Epoch 4, batch 4284
Training loss: 1.7976291179656982 

Epoch 4, batch 4285
Training loss: 1.802156686782837 

Epoch 4, batch 4286
Training loss: 1.6839711666107178 

Epoch 4, batch 4287
Training loss: 1.8364208936691284 

Epoch 4, batch 4288
Training loss: 1.9476943016052246 

Epoch 4, batch 4289
Training loss: 1.8128489255905151 

Epoch 4, batch 4290
Training loss: 1.825711727142334 

Epoch 4, batch 4291
Training loss: 1.5994172096252441 

Epoch 4, batch 4292
Training loss: 1.8639600276947021 

Epoch 4, batch 4293
Training loss: 1.5797821283340454 

Epoch 4, batch 4294
Training loss: 1.715699315071106 

Epoch 4, batch 4295
Training loss: 1.7168262004852295 

Epoch 4, batch 4296
Training loss: 1.7453700304031372 

Epoch 4, batch 4297
Training loss: 1.5258370637893677 

Epoch 4, batch 4484
Training loss: 1.815812110900879 

Epoch 4, batch 4485
Training loss: 1.8012149333953857 

Epoch 4, batch 4486
Training loss: 1.715592622756958 

Epoch 4, batch 4487
Training loss: 1.694471836090088 

Epoch 4, batch 4488
Training loss: 1.7561674118041992 

Epoch 4, batch 4489
Training loss: 1.7975168228149414 

Epoch 4, batch 4490
Training loss: 1.7599725723266602 

Epoch 4, batch 4491
Training loss: 1.5884069204330444 

Epoch 4, batch 4492
Training loss: 1.784985065460205 

Epoch 4, batch 4493
Training loss: 1.6726617813110352 

Epoch 4, batch 4494
Training loss: 1.7583603858947754 

Epoch 4, batch 4495
Training loss: 1.630081295967102 

Epoch 4, batch 4496
Training loss: 1.9283514022827148 

Epoch 4, batch 4497
Training loss: 1.7684204578399658 

Epoch 4, batch 4498
Training loss: 1.7994321584701538 

Epoch 4, batch 4499
Training loss: 1.9820866584777832 

Epoch 4, batch 4500
Training loss: 1.6608632802963257 

Epoch 4, batch 4501
Training loss: 1.7439510822296143

Epoch 4, batch 4689
Training loss: 1.7039144039154053 

Epoch 4, batch 4690
Training loss: 1.7619131803512573 

Epoch 4, batch 4691
Training loss: 1.7981231212615967 

Epoch 4, batch 4692
Training loss: 1.6671226024627686 

Epoch 4, batch 4693
Training loss: 1.7962844371795654 

Epoch 4, batch 4694
Training loss: 1.8045322895050049 

Epoch 4, batch 4695
Training loss: 1.677990436553955 

Epoch 4, batch 4696
Training loss: 1.7736268043518066 

Epoch 4, batch 4697
Training loss: 1.7499561309814453 

Epoch 4, batch 4698
Training loss: 1.6142430305480957 

Epoch 4, batch 4699
Training loss: 1.7013391256332397 

Epoch 4, batch 4700
Training loss: 1.8592289686203003 

Epoch 4, batch 4701
Training loss: 1.891464352607727 

Epoch 4, batch 4702
Training loss: 1.8035848140716553 

Epoch 4, batch 4703
Training loss: 1.640673041343689 

Epoch 4, batch 4704
Training loss: 1.5279057025909424 

Epoch 4, batch 4705
Training loss: 1.659940242767334 

Epoch 4, batch 4706
Training loss: 1.616641163825988

Epoch 4, batch 4891
Training loss: 1.7388113737106323 

Epoch 4, batch 4892
Training loss: 1.8168950080871582 

Epoch 4, batch 4893
Training loss: 1.7620282173156738 

Epoch 4, batch 4894
Training loss: 1.7075639963150024 

Epoch 4, batch 4895
Training loss: 1.5059866905212402 

Epoch 4, batch 4896
Training loss: 1.6264898777008057 

Epoch 4, batch 4897
Training loss: 1.5334019660949707 

Epoch 4, batch 4898
Training loss: 1.5085135698318481 

Epoch 4, batch 4899
Training loss: 1.8442885875701904 

Epoch 4, batch 4900
Training loss: 1.661841630935669 

Epoch 4, batch 4901
Training loss: 1.7576557397842407 

Epoch 4, batch 4902
Training loss: 1.5903130769729614 

Epoch 4, batch 4903
Training loss: 1.7938038110733032 

Epoch 4, batch 4904
Training loss: 1.7411854267120361 

Epoch 4, batch 4905
Training loss: 1.5308821201324463 

Epoch 4, batch 4906
Training loss: 1.5350143909454346 

Epoch 4, batch 4907
Training loss: 1.909095287322998 

Epoch 4, batch 4908
Training loss: 1.7390501499176

Epoch 4, batch 5093
Training loss: 1.6668270826339722 

Epoch 4, batch 5094
Training loss: 1.841647744178772 

Epoch 4, batch 5095
Training loss: 1.9616248607635498 

Epoch 4, batch 5096
Training loss: 1.6909443140029907 

Epoch 4, batch 5097
Training loss: 1.6026486158370972 

Epoch 4, batch 5098
Training loss: 1.58533775806427 

Epoch 4, batch 5099
Training loss: 1.9396941661834717 

Epoch 4, batch 5100
Training loss: 1.534271240234375 

Epoch 4, batch 5101
Training loss: 1.7333179712295532 

Epoch 4, batch 5102
Training loss: 1.8199052810668945 

Epoch 4, batch 5103
Training loss: 1.8269513845443726 

Epoch 4, batch 5104
Training loss: 1.7860898971557617 

Epoch 4, batch 5105
Training loss: 1.8358426094055176 

Epoch 4, batch 5106
Training loss: 1.5435714721679688 

Epoch 4, batch 5107
Training loss: 1.88330078125 

Epoch 4, batch 5108
Training loss: 1.7994341850280762 

Epoch 4, batch 5109
Training loss: 1.6977112293243408 

Epoch 4, batch 5110
Training loss: 1.7957966327667236 

E

Epoch 4, batch 5296
Training loss: 1.9857100248336792 

Epoch 4, batch 5297
Training loss: 1.6483608484268188 

Epoch 4, batch 5298
Training loss: 1.5521221160888672 

Epoch 4, batch 5299
Training loss: 1.7102056741714478 

Epoch 4, batch 5300
Training loss: 1.7959673404693604 

Epoch 4, batch 5301
Training loss: 1.7339913845062256 

Epoch 4, batch 5302
Training loss: 1.740225076675415 

Epoch 4, batch 5303
Training loss: 1.9793994426727295 

Epoch 4, batch 5304
Training loss: 1.7187583446502686 

Epoch 4, batch 5305
Training loss: 1.9150893688201904 

Epoch 4, batch 5306
Training loss: 1.8015549182891846 

Epoch 4, batch 5307
Training loss: 1.9180288314819336 

Epoch 4, batch 5308
Training loss: 1.8519420623779297 

Epoch 4, batch 5309
Training loss: 1.6096585988998413 

Epoch 4, batch 5310
Training loss: 1.5963445901870728 

Epoch 4, batch 5311
Training loss: 1.5887092351913452 

Epoch 4, batch 5312
Training loss: 1.9122061729431152 

Epoch 4, batch 5313
Training loss: 1.711495637893

Epoch 4, batch 5503
Training loss: 1.6167469024658203 

Epoch 4, batch 5504
Training loss: 2.0312082767486572 

Epoch 4, batch 5505
Training loss: 1.7599315643310547 

Epoch 4, batch 5506
Training loss: 1.7827410697937012 

Epoch 4, batch 5507
Training loss: 1.893040418624878 

Epoch 4, batch 5508
Training loss: 1.5276529788970947 

Epoch 4, batch 5509
Training loss: 1.5866637229919434 

Epoch 4, batch 5510
Training loss: 1.8833999633789062 

Epoch 4, batch 5511
Training loss: 1.8459198474884033 

Epoch 4, batch 5512
Training loss: 1.6027917861938477 

Epoch 4, batch 5513
Training loss: 1.6636638641357422 

Epoch 4, batch 5514
Training loss: 1.7924615144729614 

Epoch 4, batch 5515
Training loss: 1.6841342449188232 

Epoch 4, batch 5516
Training loss: 1.9655604362487793 

Epoch 4, batch 5517
Training loss: 1.7119566202163696 

Epoch 4, batch 5518
Training loss: 1.6682765483856201 

Epoch 4, batch 5519
Training loss: 1.5825769901275635 

Epoch 4, batch 5520
Training loss: 1.601034164428

Epoch 4, batch 5706
Training loss: 1.673532485961914 

Epoch 4, batch 5707
Training loss: 1.5980192422866821 

Epoch 4, batch 5708
Training loss: 1.6111692190170288 

Epoch 4, batch 5709
Training loss: 1.6225727796554565 

Epoch 4, batch 5710
Training loss: 1.8174972534179688 

Epoch 4, batch 5711
Training loss: 1.9022884368896484 

Epoch 4, batch 5712
Training loss: 1.9931831359863281 

Epoch 4, batch 5713
Training loss: 1.9945124387741089 

Epoch 4, batch 5714
Training loss: 1.7848056554794312 

Epoch 4, batch 5715
Training loss: 1.7705117464065552 

Epoch 4, batch 5716
Training loss: 1.6674809455871582 

Epoch 4, batch 5717
Training loss: 1.5727559328079224 

Epoch 4, batch 5718
Training loss: 1.9226233959197998 

Epoch 4, batch 5719
Training loss: 1.5790660381317139 

Epoch 4, batch 5720
Training loss: 1.6258827447891235 

Epoch 4, batch 5721
Training loss: 1.559065818786621 

Epoch 4, batch 5722
Training loss: 1.7540113925933838 

Epoch 4, batch 5723
Training loss: 1.5611929893493

Epoch 4, batch 5907
Training loss: 1.7419313192367554 

Epoch 4, batch 5908
Training loss: 1.7142634391784668 

Epoch 4, batch 5909
Training loss: 1.6360160112380981 

Epoch 4, batch 5910
Training loss: 1.5620982646942139 

Epoch 4, batch 5911
Training loss: 1.7656927108764648 

Epoch 4, batch 5912
Training loss: 1.5908489227294922 

Epoch 4, batch 5913
Training loss: 1.6464948654174805 

Epoch 4, batch 5914
Training loss: 1.9292113780975342 

Epoch 4, batch 5915
Training loss: 1.5955551862716675 

Epoch 4, batch 5916
Training loss: 1.7975795269012451 

Epoch 4, batch 5917
Training loss: 1.756439208984375 

Epoch 4, batch 5918
Training loss: 1.7997965812683105 

Epoch 4, batch 5919
Training loss: 1.5376169681549072 

Epoch 4, batch 5920
Training loss: 1.5580885410308838 

Epoch 4, batch 5921
Training loss: 2.0001981258392334 

Epoch 4, batch 5922
Training loss: 1.7682490348815918 

Epoch 4, batch 5923
Training loss: 1.6189864873886108 

Epoch 4, batch 5924
Training loss: 1.795931339263

Epoch 5, batch 105
Training loss: 1.7283594608306885 

Epoch 5, batch 106
Training loss: 1.8898001909255981 

Epoch 5, batch 107
Training loss: 1.7803254127502441 

Epoch 5, batch 108
Training loss: 1.5447466373443604 

Epoch 5, batch 109
Training loss: 1.8252003192901611 

Epoch 5, batch 110
Training loss: 1.9387153387069702 

Epoch 5, batch 111
Training loss: 1.5392608642578125 

Epoch 5, batch 112
Training loss: 1.9250898361206055 

Epoch 5, batch 113
Training loss: 1.6648417711257935 

Epoch 5, batch 114
Training loss: 1.8302440643310547 

Epoch 5, batch 115
Training loss: 1.7879457473754883 

Epoch 5, batch 116
Training loss: 1.7847505807876587 

Epoch 5, batch 117
Training loss: 1.5277392864227295 

Epoch 5, batch 118
Training loss: 1.7241774797439575 

Epoch 5, batch 119
Training loss: 1.6937260627746582 

Epoch 5, batch 120
Training loss: 1.7057636976242065 

Epoch 5, batch 121
Training loss: 1.6827398538589478 

Epoch 5, batch 122
Training loss: 1.82738196849823 

Epoch 5, bat

Epoch 5, batch 308
Training loss: 1.70307195186615 

Epoch 5, batch 309
Training loss: 1.6457293033599854 

Epoch 5, batch 310
Training loss: 1.6455100774765015 

Epoch 5, batch 311
Training loss: 1.6888134479522705 

Epoch 5, batch 312
Training loss: 1.7255011796951294 

Epoch 5, batch 313
Training loss: 1.6362465620040894 

Epoch 5, batch 314
Training loss: 1.7213013172149658 

Epoch 5, batch 315
Training loss: 1.6413671970367432 

Epoch 5, batch 316
Training loss: 1.6389211416244507 

Epoch 5, batch 317
Training loss: 1.7527440786361694 

Epoch 5, batch 318
Training loss: 1.7837920188903809 

Epoch 5, batch 319
Training loss: 1.6775994300842285 

Epoch 5, batch 320
Training loss: 1.8944323062896729 

Epoch 5, batch 321
Training loss: 1.7631940841674805 

Epoch 5, batch 322
Training loss: 1.5174447298049927 

Epoch 5, batch 323
Training loss: 1.5701332092285156 

Epoch 5, batch 324
Training loss: 1.7069281339645386 

Epoch 5, batch 325
Training loss: 1.6947362422943115 

Epoch 5, bat

Epoch 5, batch 511
Training loss: 1.818514347076416 

Epoch 5, batch 512
Training loss: 1.8871854543685913 

Epoch 5, batch 513
Training loss: 1.5294299125671387 

Epoch 5, batch 514
Training loss: 1.8104546070098877 

Epoch 5, batch 515
Training loss: 1.6476651430130005 

Epoch 5, batch 516
Training loss: 1.868293285369873 

Epoch 5, batch 517
Training loss: 1.974501132965088 

Epoch 5, batch 518
Training loss: 1.7412883043289185 

Epoch 5, batch 519
Training loss: 1.8566758632659912 

Epoch 5, batch 520
Training loss: 1.6168819665908813 

Epoch 5, batch 521
Training loss: 1.4886215925216675 

Epoch 5, batch 522
Training loss: 1.8369994163513184 

Epoch 5, batch 523
Training loss: 1.946232795715332 

Epoch 5, batch 524
Training loss: 1.6316773891448975 

Epoch 5, batch 525
Training loss: 1.67648184299469 

Epoch 5, batch 526
Training loss: 2.1808371543884277 

Epoch 5, batch 527
Training loss: 1.8708608150482178 

Epoch 5, batch 528
Training loss: 1.5688109397888184 

Epoch 5, batch 5

Epoch 5, batch 712
Training loss: 1.872741937637329 

Epoch 5, batch 713
Training loss: 1.6033331155776978 

Epoch 5, batch 714
Training loss: 1.6192207336425781 

Epoch 5, batch 715
Training loss: 1.8800134658813477 

Epoch 5, batch 716
Training loss: 1.835609793663025 

Epoch 5, batch 717
Training loss: 1.5923136472702026 

Epoch 5, batch 718
Training loss: 1.9611923694610596 

Epoch 5, batch 719
Training loss: 1.7539819478988647 

Epoch 5, batch 720
Training loss: 1.8760418891906738 

Epoch 5, batch 721
Training loss: 1.9763669967651367 

Epoch 5, batch 722
Training loss: 1.7927360534667969 

Epoch 5, batch 723
Training loss: 1.7434165477752686 

Epoch 5, batch 724
Training loss: 1.8904008865356445 

Epoch 5, batch 725
Training loss: 1.8440088033676147 

Epoch 5, batch 726
Training loss: 1.8330388069152832 

Epoch 5, batch 727
Training loss: 1.7757408618927002 

Epoch 5, batch 728
Training loss: 1.6474918127059937 

Epoch 5, batch 729
Training loss: 1.6297848224639893 

Epoch 5, bat

Epoch 5, batch 897
Training loss: 1.9262466430664062 

Epoch 5, batch 898
Training loss: 1.6769903898239136 

Epoch 5, batch 899
Training loss: 1.5622241497039795 

Epoch 5, batch 900
Training loss: 1.7423595190048218 

Epoch 5, batch 901
Training loss: 1.5760838985443115 

Epoch 5, batch 902
Training loss: 1.7859277725219727 

Epoch 5, batch 903
Training loss: 1.8085942268371582 

Epoch 5, batch 904
Training loss: 1.6467307806015015 

Epoch 5, batch 905
Training loss: 1.6960210800170898 

Epoch 5, batch 906
Training loss: 1.821724772453308 

Epoch 5, batch 907
Training loss: 1.595301628112793 

Epoch 5, batch 908
Training loss: 1.6844305992126465 

Epoch 5, batch 909
Training loss: 1.5943763256072998 

Epoch 5, batch 910
Training loss: 1.512499213218689 

Epoch 5, batch 911
Training loss: 1.6466965675354004 

Epoch 5, batch 912
Training loss: 1.4989640712738037 

Epoch 5, batch 913
Training loss: 1.9610134363174438 

Epoch 5, batch 914
Training loss: 1.867764949798584 

Epoch 5, batch

Epoch 5, batch 1096
Training loss: 1.9054343700408936 

Epoch 5, batch 1097
Training loss: 1.6662402153015137 

Epoch 5, batch 1098
Training loss: 1.8882782459259033 

Epoch 5, batch 1099
Training loss: 1.9832526445388794 

Epoch 5, batch 1100
Training loss: 1.8651922941207886 

Epoch 5, batch 1101
Training loss: 1.857743501663208 

Epoch 5, batch 1102
Training loss: 1.7103679180145264 

Epoch 5, batch 1103
Training loss: 1.5363163948059082 

Epoch 5, batch 1104
Training loss: 1.8048810958862305 

Epoch 5, batch 1105
Training loss: 1.4782586097717285 

Epoch 5, batch 1106
Training loss: 1.5539827346801758 

Epoch 5, batch 1107
Training loss: 1.874708652496338 

Epoch 5, batch 1108
Training loss: 1.5281271934509277 

Epoch 5, batch 1109
Training loss: 1.6427110433578491 

Epoch 5, batch 1110
Training loss: 1.8053981065750122 

Epoch 5, batch 1111
Training loss: 1.896196722984314 

Epoch 5, batch 1112
Training loss: 1.940216302871704 

Epoch 5, batch 1113
Training loss: 1.981908559799194

Epoch 5, batch 1297
Training loss: 1.4702003002166748 

Epoch 5, batch 1298
Training loss: 1.68885338306427 

Epoch 5, batch 1299
Training loss: 1.6605678796768188 

Epoch 5, batch 1300
Training loss: 1.6964433193206787 

Epoch 5, batch 1301
Training loss: 1.8775066137313843 

Epoch 5, batch 1302
Training loss: 1.734621524810791 

Epoch 5, batch 1303
Training loss: 1.7606029510498047 

Epoch 5, batch 1304
Training loss: 1.5735920667648315 

Epoch 5, batch 1305
Training loss: 1.6250311136245728 

Epoch 5, batch 1306
Training loss: 1.6367583274841309 

Epoch 5, batch 1307
Training loss: 1.8654634952545166 

Epoch 5, batch 1308
Training loss: 1.7898460626602173 

Epoch 5, batch 1309
Training loss: 1.659095048904419 

Epoch 5, batch 1310
Training loss: 1.66532301902771 

Epoch 5, batch 1311
Training loss: 1.6208853721618652 

Epoch 5, batch 1312
Training loss: 1.806298017501831 

Epoch 5, batch 1313
Training loss: 1.6211941242218018 

Epoch 5, batch 1314
Training loss: 1.8355770111083984 


Epoch 5, batch 1499
Training loss: 1.5069804191589355 

Epoch 5, batch 1500
Training loss: 1.4630405902862549 

Epoch 5, batch 1501
Training loss: 1.6684927940368652 

Epoch 5, batch 1502
Training loss: 1.8592543601989746 

Epoch 5, batch 1503
Training loss: 1.8826179504394531 

Epoch 5, batch 1504
Training loss: 1.760451316833496 

Epoch 5, batch 1505
Training loss: 1.7368547916412354 

Epoch 5, batch 1506
Training loss: 1.8631947040557861 

Epoch 5, batch 1507
Training loss: 1.6548612117767334 

Epoch 5, batch 1508
Training loss: 1.6310758590698242 

Epoch 5, batch 1509
Training loss: 1.712579369544983 

Epoch 5, batch 1510
Training loss: 1.9231905937194824 

Epoch 5, batch 1511
Training loss: 1.5041359663009644 

Epoch 5, batch 1512
Training loss: 1.6157755851745605 

Epoch 5, batch 1513
Training loss: 1.4903783798217773 

Epoch 5, batch 1514
Training loss: 1.93917715549469 

Epoch 5, batch 1515
Training loss: 1.71958327293396 

Epoch 5, batch 1516
Training loss: 1.7904822826385498 

Epoch 5, batch 1701
Training loss: 1.6104109287261963 

Epoch 5, batch 1702
Training loss: 1.7298593521118164 

Epoch 5, batch 1703
Training loss: 1.8852553367614746 

Epoch 5, batch 1704
Training loss: 1.694224238395691 

Epoch 5, batch 1705
Training loss: 1.5971906185150146 

Epoch 5, batch 1706
Training loss: 2.056654691696167 

Epoch 5, batch 1707
Training loss: 1.6161781549453735 

Epoch 5, batch 1708
Training loss: 1.5690546035766602 

Epoch 5, batch 1709
Training loss: 1.5169248580932617 

Epoch 5, batch 1710
Training loss: 1.8852949142456055 

Epoch 5, batch 1711
Training loss: 1.5865294933319092 

Epoch 5, batch 1712
Training loss: 1.9283783435821533 

Epoch 5, batch 1713
Training loss: 1.872878909111023 

Epoch 5, batch 1714
Training loss: 1.5148532390594482 

Epoch 5, batch 1715
Training loss: 1.8921767473220825 

Epoch 5, batch 1716
Training loss: 1.769007682800293 

Epoch 5, batch 1717
Training loss: 1.6411020755767822 

Epoch 5, batch 1718
Training loss: 1.683156609535217

Epoch 5, batch 1898
Training loss: 1.6226487159729004 

Epoch 5, batch 1899
Training loss: 1.805755853652954 

Epoch 5, batch 1900
Training loss: 1.735938549041748 

Epoch 5, batch 1901
Training loss: 1.6927549839019775 

Epoch 5, batch 1902
Training loss: 1.698786973953247 

Epoch 5, batch 1903
Training loss: 1.9510198831558228 

Epoch 5, batch 1904
Training loss: 1.7787551879882812 

Epoch 5, batch 1905
Training loss: 2.0248935222625732 

Epoch 5, batch 1906
Training loss: 1.613481044769287 

Epoch 5, batch 1907
Training loss: 1.75948965549469 

Epoch 5, batch 1908
Training loss: 1.9584176540374756 

Epoch 5, batch 1909
Training loss: 2.0043089389801025 

Epoch 5, batch 1910
Training loss: 1.833714485168457 

Epoch 5, batch 1911
Training loss: 1.9315019845962524 

Epoch 5, batch 1912
Training loss: 1.7790405750274658 

Epoch 5, batch 1913
Training loss: 1.6034176349639893 

Epoch 5, batch 1914
Training loss: 1.7229174375534058 

Epoch 5, batch 1915
Training loss: 1.635859727859497 



Epoch 5, batch 2096
Training loss: 1.9734885692596436 

Epoch 5, batch 2097
Training loss: 1.9112560749053955 

Epoch 5, batch 2098
Training loss: 1.9460783004760742 

Epoch 5, batch 2099
Training loss: 1.6350884437561035 

Epoch 5, batch 2100
Training loss: 1.9270164966583252 

Epoch 5, batch 2101
Training loss: 1.9708305597305298 

Epoch 5, batch 2102
Training loss: 1.6856614351272583 

Epoch 5, batch 2103
Training loss: 1.974365234375 

Epoch 5, batch 2104
Training loss: 1.8852237462997437 

Epoch 5, batch 2105
Training loss: 1.9618804454803467 

Epoch 5, batch 2106
Training loss: 1.5108929872512817 

Epoch 5, batch 2107
Training loss: 1.5891417264938354 

Epoch 5, batch 2108
Training loss: 1.7199255228042603 

Epoch 5, batch 2109
Training loss: 1.6520295143127441 

Epoch 5, batch 2110
Training loss: 1.8626116514205933 

Epoch 5, batch 2111
Training loss: 1.8116528987884521 

Epoch 5, batch 2112
Training loss: 1.6343308687210083 

Epoch 5, batch 2113
Training loss: 1.792453765869140

Epoch 5, batch 2295
Training loss: 1.7417449951171875 

Epoch 5, batch 2296
Training loss: 1.7356386184692383 

Epoch 5, batch 2297
Training loss: 1.7080044746398926 

Epoch 5, batch 2298
Training loss: 1.8350929021835327 

Epoch 5, batch 2299
Training loss: 1.8212411403656006 

Epoch 5, batch 2300
Training loss: 1.735455870628357 

Epoch 5, batch 2301
Training loss: 1.4932953119277954 

Epoch 5, batch 2302
Training loss: 1.7793948650360107 

Epoch 5, batch 2303
Training loss: 1.688563585281372 

Epoch 5, batch 2304
Training loss: 1.7803072929382324 

Epoch 5, batch 2305
Training loss: 1.823822021484375 

Epoch 5, batch 2306
Training loss: 1.6737432479858398 

Epoch 5, batch 2307
Training loss: 1.7335331439971924 

Epoch 5, batch 2308
Training loss: 1.5953948497772217 

Epoch 5, batch 2309
Training loss: 1.6742565631866455 

Epoch 5, batch 2310
Training loss: 1.6312053203582764 

Epoch 5, batch 2311
Training loss: 1.7889734506607056 

Epoch 5, batch 2312
Training loss: 1.75581812858581

Epoch 5, batch 2472
Training loss: 1.8226035833358765 

Epoch 5, batch 2473
Training loss: 1.560009241104126 

Epoch 5, batch 2474
Training loss: 1.6348663568496704 

Epoch 5, batch 2475
Training loss: 1.7823253870010376 

Epoch 5, batch 2476
Training loss: 1.6722851991653442 

Epoch 5, batch 2477
Training loss: 1.5840076208114624 

Epoch 5, batch 2478
Training loss: 1.9035234451293945 

Epoch 5, batch 2479
Training loss: 2.001678943634033 

Epoch 5, batch 2480
Training loss: 1.9438585042953491 

Epoch 5, batch 2481
Training loss: 1.8355424404144287 

Epoch 5, batch 2482
Training loss: 1.8166875839233398 

Epoch 5, batch 2483
Training loss: 1.9670190811157227 

Epoch 5, batch 2484
Training loss: 1.5954827070236206 

Epoch 5, batch 2485
Training loss: 1.520451545715332 

Epoch 5, batch 2486
Training loss: 1.7999203205108643 

Epoch 5, batch 2487
Training loss: 1.6135926246643066 

Epoch 5, batch 2488
Training loss: 1.750889539718628 

Epoch 5, batch 2489
Training loss: 1.834432005882263

Epoch 5, batch 2668
Training loss: 1.7243340015411377 

Epoch 5, batch 2669
Training loss: 2.039787530899048 

Epoch 5, batch 2670
Training loss: 1.735677719116211 

Epoch 5, batch 2671
Training loss: 1.8785814046859741 

Epoch 5, batch 2672
Training loss: 1.899390459060669 

Epoch 5, batch 2673
Training loss: 1.8109744787216187 

Epoch 5, batch 2674
Training loss: 1.7348864078521729 

Epoch 5, batch 2675
Training loss: 1.4691312313079834 

Epoch 5, batch 2676
Training loss: 1.555114984512329 

Epoch 5, batch 2677
Training loss: 1.5742450952529907 

Epoch 5, batch 2678
Training loss: 1.9432567358016968 

Epoch 5, batch 2679
Training loss: 1.6526093482971191 

Epoch 5, batch 2680
Training loss: 1.6018460988998413 

Epoch 5, batch 2681
Training loss: 1.6735363006591797 

Epoch 5, batch 2682
Training loss: 1.6506130695343018 

Epoch 5, batch 2683
Training loss: 1.743185043334961 

Epoch 5, batch 2684
Training loss: 1.9499305486679077 

Epoch 5, batch 2685
Training loss: 1.6758383512496948

Epoch 5, batch 2852
Training loss: 1.6020002365112305 

Epoch 5, batch 2853
Training loss: 1.8579130172729492 

Epoch 5, batch 2854
Training loss: 1.799412727355957 

Epoch 5, batch 2855
Training loss: 1.8359031677246094 

Epoch 5, batch 2856
Training loss: 1.622599720954895 

Epoch 5, batch 2857
Training loss: 1.7170816659927368 

Epoch 5, batch 2858
Training loss: 1.6536078453063965 

Epoch 5, batch 2859
Training loss: 1.6251318454742432 

Epoch 5, batch 2860
Training loss: 1.865299105644226 

Epoch 5, batch 2861
Training loss: 1.696656584739685 

Epoch 5, batch 2862
Training loss: 1.5920765399932861 

Epoch 5, batch 2863
Training loss: 1.6717088222503662 

Epoch 5, batch 2864
Training loss: 1.8922051191329956 

Epoch 5, batch 2865
Training loss: 1.6079432964324951 

Epoch 5, batch 2866
Training loss: 1.8806798458099365 

Epoch 5, batch 2867
Training loss: 1.7963106632232666 

Epoch 5, batch 2868
Training loss: 1.9797329902648926 

Epoch 5, batch 2869
Training loss: 1.997340917587280

Epoch 5, batch 3040
Training loss: 1.7735140323638916 

Epoch 5, batch 3041
Training loss: 1.7059063911437988 

Epoch 5, batch 3042
Training loss: 1.8877196311950684 

Epoch 5, batch 3043
Training loss: 1.942962408065796 

Epoch 5, batch 3044
Training loss: 1.6597912311553955 

Epoch 5, batch 3045
Training loss: 1.8037391901016235 

Epoch 5, batch 3046
Training loss: 1.7172088623046875 

Epoch 5, batch 3047
Training loss: 1.6959941387176514 

Epoch 5, batch 3048
Training loss: 1.8106883764266968 

Epoch 5, batch 3049
Training loss: 1.9588823318481445 

Epoch 5, batch 3050
Training loss: 1.6305441856384277 

Epoch 5, batch 3051
Training loss: 1.6646792888641357 

Epoch 5, batch 3052
Training loss: 1.6651220321655273 

Epoch 5, batch 3053
Training loss: 1.5103007555007935 

Epoch 5, batch 3054
Training loss: 1.870305061340332 

Epoch 5, batch 3055
Training loss: 1.7827198505401611 

Epoch 5, batch 3056
Training loss: 1.6084115505218506 

Epoch 5, batch 3057
Training loss: 1.8543316125869

Epoch 5, batch 3243
Training loss: 1.9335826635360718 

Epoch 5, batch 3244
Training loss: 1.752946138381958 

Epoch 5, batch 3245
Training loss: 1.6547117233276367 

Epoch 5, batch 3246
Training loss: 1.5983976125717163 

Epoch 5, batch 3247
Training loss: 1.8373221158981323 

Epoch 5, batch 3248
Training loss: 2.00618839263916 

Epoch 5, batch 3249
Training loss: 1.7967902421951294 

Epoch 5, batch 3250
Training loss: 1.7776172161102295 

Epoch 5, batch 3251
Training loss: 1.8350582122802734 

Epoch 5, batch 3252
Training loss: 1.7846167087554932 

Epoch 5, batch 3253
Training loss: 1.5918169021606445 

Epoch 5, batch 3254
Training loss: 1.872841715812683 

Epoch 5, batch 3255
Training loss: 2.0440657138824463 

Epoch 5, batch 3256
Training loss: 2.03317928314209 

Epoch 5, batch 3257
Training loss: 1.7750325202941895 

Epoch 5, batch 3258
Training loss: 1.6280062198638916 

Epoch 5, batch 3259
Training loss: 1.616977334022522 

Epoch 5, batch 3260
Training loss: 1.9599058628082275 


Epoch 5, batch 3442
Training loss: 1.7773442268371582 

Epoch 5, batch 3443
Training loss: 1.6850537061691284 

Epoch 5, batch 3444
Training loss: 1.9199583530426025 

Epoch 5, batch 3445
Training loss: 1.8262107372283936 

Epoch 5, batch 3446
Training loss: 1.8905918598175049 

Epoch 5, batch 3447
Training loss: 1.7083353996276855 

Epoch 5, batch 3448
Training loss: 1.575974702835083 

Epoch 5, batch 3449
Training loss: 1.9259223937988281 

Epoch 5, batch 3450
Training loss: 1.6959593296051025 

Epoch 5, batch 3451
Training loss: 2.021641731262207 

Epoch 5, batch 3452
Training loss: 1.7835875749588013 

Epoch 5, batch 3453
Training loss: 1.7761428356170654 

Epoch 5, batch 3454
Training loss: 1.8545520305633545 

Epoch 5, batch 3455
Training loss: 1.9594810009002686 

Epoch 5, batch 3456
Training loss: 1.7577447891235352 

Epoch 5, batch 3457
Training loss: 1.7061662673950195 

Epoch 5, batch 3458
Training loss: 1.849182367324829 

Epoch 5, batch 3459
Training loss: 1.63229775428771

Epoch 5, batch 3641
Training loss: 1.6876572370529175 

Epoch 5, batch 3642
Training loss: 1.6386008262634277 

Epoch 5, batch 3643
Training loss: 1.5859848260879517 

Epoch 5, batch 3644
Training loss: 1.6506785154342651 

Epoch 5, batch 3645
Training loss: 1.5343775749206543 

Epoch 5, batch 3646
Training loss: 1.9083281755447388 

Epoch 5, batch 3647
Training loss: 1.8215137720108032 

Epoch 5, batch 3648
Training loss: 1.8851970434188843 

Epoch 5, batch 3649
Training loss: 1.9320006370544434 

Epoch 5, batch 3650
Training loss: 1.5903241634368896 

Epoch 5, batch 3651
Training loss: 1.8169059753417969 

Epoch 5, batch 3652
Training loss: 1.8248097896575928 

Epoch 5, batch 3653
Training loss: 1.8225293159484863 

Epoch 5, batch 3654
Training loss: 1.7012052536010742 

Epoch 5, batch 3655
Training loss: 1.4979289770126343 

Epoch 5, batch 3656
Training loss: 1.6456782817840576 

Epoch 5, batch 3657
Training loss: 1.8234589099884033 

Epoch 5, batch 3658
Training loss: 1.83067905902

Epoch 5, batch 3839
Training loss: 1.8335461616516113 

Epoch 5, batch 3840
Training loss: 1.6782742738723755 

Epoch 5, batch 3841
Training loss: 1.7373648881912231 

Epoch 5, batch 3842
Training loss: 2.0555591583251953 

Epoch 5, batch 3843
Training loss: 1.5818707942962646 

Epoch 5, batch 3844
Training loss: 1.9284539222717285 

Epoch 5, batch 3845
Training loss: 1.5358296632766724 

Epoch 5, batch 3846
Training loss: 1.940294623374939 

Epoch 5, batch 3847
Training loss: 1.6311336755752563 

Epoch 5, batch 3848
Training loss: 1.944762945175171 

Epoch 5, batch 3849
Training loss: 1.698274850845337 

Epoch 5, batch 3850
Training loss: 1.8366397619247437 

Epoch 5, batch 3851
Training loss: 1.930253267288208 

Epoch 5, batch 3852
Training loss: 1.696088433265686 

Epoch 5, batch 3853
Training loss: 1.857470154762268 

Epoch 5, batch 3854
Training loss: 1.9151042699813843 

Epoch 5, batch 3855
Training loss: 1.7627274990081787 

Epoch 5, batch 3856
Training loss: 1.6852306127548218 

Epoch 5, batch 4043
Training loss: 1.7664986848831177 

Epoch 5, batch 4044
Training loss: 1.550609827041626 

Epoch 5, batch 4045
Training loss: 1.8580256700515747 

Epoch 5, batch 4046
Training loss: 1.8183996677398682 

Epoch 5, batch 4047
Training loss: 1.7604924440383911 

Epoch 5, batch 4048
Training loss: 1.753770112991333 

Epoch 5, batch 4049
Training loss: 1.5185132026672363 

Epoch 5, batch 4050
Training loss: 1.7776947021484375 

Epoch 5, batch 4051
Training loss: 1.7935582399368286 

Epoch 5, batch 4052
Training loss: 1.945778489112854 

Epoch 5, batch 4053
Training loss: 1.6953246593475342 

Epoch 5, batch 4054
Training loss: 1.6340914964675903 

Epoch 5, batch 4055
Training loss: 1.6795002222061157 

Epoch 5, batch 4056
Training loss: 1.6132557392120361 

Epoch 5, batch 4057
Training loss: 2.04441499710083 

Epoch 5, batch 4058
Training loss: 1.6113635301589966 

Epoch 5, batch 4059
Training loss: 1.9573835134506226 

Epoch 5, batch 4060
Training loss: 1.6078176498413086

Epoch 5, batch 4246
Training loss: 1.5714218616485596 

Epoch 5, batch 4247
Training loss: 1.5524901151657104 

Epoch 5, batch 4248
Training loss: 1.8529380559921265 

Epoch 5, batch 4249
Training loss: 1.5642873048782349 

Epoch 5, batch 4250
Training loss: 1.755752444267273 

Epoch 5, batch 4251
Training loss: 1.667177438735962 

Epoch 5, batch 4252
Training loss: 1.8441956043243408 

Epoch 5, batch 4253
Training loss: 1.8534774780273438 

Epoch 5, batch 4254
Training loss: 1.5780366659164429 

Epoch 5, batch 4255
Training loss: 1.820471167564392 

Epoch 5, batch 4256
Training loss: 1.5448685884475708 

Epoch 5, batch 4257
Training loss: 1.521918773651123 

Epoch 5, batch 4258
Training loss: 1.768951416015625 

Epoch 5, batch 4259
Training loss: 1.9037314653396606 

Epoch 5, batch 4260
Training loss: 1.6134790182113647 

Epoch 5, batch 4261
Training loss: 1.9452059268951416 

Epoch 5, batch 4262
Training loss: 2.0195634365081787 

Epoch 5, batch 4263
Training loss: 1.5585545301437378

Epoch 5, batch 4447
Training loss: 1.6306018829345703 

Epoch 5, batch 4448
Training loss: 1.6532535552978516 

Epoch 5, batch 4449
Training loss: 1.6171694993972778 

Epoch 5, batch 4450
Training loss: 1.760826587677002 

Epoch 5, batch 4451
Training loss: 1.9247190952301025 

Epoch 5, batch 4452
Training loss: 1.816270351409912 

Epoch 5, batch 4453
Training loss: 1.9394524097442627 

Epoch 5, batch 4454
Training loss: 1.5783672332763672 

Epoch 5, batch 4455
Training loss: 1.8317434787750244 

Epoch 5, batch 4456
Training loss: 1.7576669454574585 

Epoch 5, batch 4457
Training loss: 1.6000254154205322 

Epoch 5, batch 4458
Training loss: 1.8462698459625244 

Epoch 5, batch 4459
Training loss: 1.8223669528961182 

Epoch 5, batch 4460
Training loss: 1.920642375946045 

Epoch 5, batch 4461
Training loss: 2.008085250854492 

Epoch 5, batch 4462
Training loss: 1.5964670181274414 

Epoch 5, batch 4463
Training loss: 1.7963511943817139 

Epoch 5, batch 4464
Training loss: 1.752388715744018

Epoch 5, batch 4651
Training loss: 1.6959725618362427 

Epoch 5, batch 4652
Training loss: 1.6557948589324951 

Epoch 5, batch 4653
Training loss: 1.73594331741333 

Epoch 5, batch 4654
Training loss: 1.5762629508972168 

Epoch 5, batch 4655
Training loss: 1.827669620513916 

Epoch 5, batch 4656
Training loss: 1.8280556201934814 

Epoch 5, batch 4657
Training loss: 1.571683645248413 

Epoch 5, batch 4658
Training loss: 1.9102566242218018 

Epoch 5, batch 4659
Training loss: 1.8537732362747192 

Epoch 5, batch 4660
Training loss: 1.8026719093322754 

Epoch 5, batch 4661
Training loss: 1.9494245052337646 

Epoch 5, batch 4662
Training loss: 1.83509361743927 

Epoch 5, batch 4663
Training loss: 1.6106362342834473 

Epoch 5, batch 4664
Training loss: 1.5882668495178223 

Epoch 5, batch 4665
Training loss: 1.5529885292053223 

Epoch 5, batch 4666
Training loss: 1.7546144723892212 

Epoch 5, batch 4667
Training loss: 1.831251621246338 

Epoch 5, batch 4668
Training loss: 1.8083319664001465 


Epoch 5, batch 4850
Training loss: 1.8970502614974976 

Epoch 5, batch 4851
Training loss: 1.905110239982605 

Epoch 5, batch 4852
Training loss: 1.633913516998291 

Epoch 5, batch 4853
Training loss: 1.6651909351348877 

Epoch 5, batch 4854
Training loss: 1.6233136653900146 

Epoch 5, batch 4855
Training loss: 1.7332208156585693 

Epoch 5, batch 4856
Training loss: 1.6062180995941162 

Epoch 5, batch 4857
Training loss: 1.859445571899414 

Epoch 5, batch 4858
Training loss: 1.9067093133926392 

Epoch 5, batch 4859
Training loss: 1.7138314247131348 

Epoch 5, batch 4860
Training loss: 1.6662217378616333 

Epoch 5, batch 4861
Training loss: 1.832566499710083 

Epoch 5, batch 4862
Training loss: 1.606226921081543 

Epoch 5, batch 4863
Training loss: 1.7802507877349854 

Epoch 5, batch 4864
Training loss: 1.661659598350525 

Epoch 5, batch 4865
Training loss: 1.9056625366210938 

Epoch 5, batch 4866
Training loss: 1.721894383430481 

Epoch 5, batch 4867
Training loss: 1.9093092679977417 


Epoch 5, batch 5049
Training loss: 1.5796540975570679 

Epoch 5, batch 5050
Training loss: 1.7442245483398438 

Epoch 5, batch 5051
Training loss: 2.04000186920166 

Epoch 5, batch 5052
Training loss: 1.7663428783416748 

Epoch 5, batch 5053
Training loss: 1.6452974081039429 

Epoch 5, batch 5054
Training loss: 1.7846286296844482 

Epoch 5, batch 5055
Training loss: 1.7028870582580566 

Epoch 5, batch 5056
Training loss: 1.7037347555160522 

Epoch 5, batch 5057
Training loss: 1.7123658657073975 

Epoch 5, batch 5058
Training loss: 1.8878517150878906 

Epoch 5, batch 5059
Training loss: 2.076117753982544 

Epoch 5, batch 5060
Training loss: 1.467133641242981 

Epoch 5, batch 5061
Training loss: 1.816669225692749 

Epoch 5, batch 5062
Training loss: 1.6967947483062744 

Epoch 5, batch 5063
Training loss: 1.8232593536376953 

Epoch 5, batch 5064
Training loss: 1.561769962310791 

Epoch 5, batch 5065
Training loss: 1.58256196975708 

Epoch 5, batch 5066
Training loss: 1.5370721817016602 



Epoch 5, batch 5247
Training loss: 1.9015295505523682 

Epoch 5, batch 5248
Training loss: 1.7980625629425049 

Epoch 5, batch 5249
Training loss: 1.7078659534454346 

Epoch 5, batch 5250
Training loss: 1.7618699073791504 

Epoch 5, batch 5251
Training loss: 1.9543397426605225 

Epoch 5, batch 5252
Training loss: 1.7974990606307983 

Epoch 5, batch 5253
Training loss: 1.7119660377502441 

Epoch 5, batch 5254
Training loss: 1.6619983911514282 

Epoch 5, batch 5255
Training loss: 1.5311411619186401 

Epoch 5, batch 5256
Training loss: 1.8457609415054321 

Epoch 5, batch 5257
Training loss: 1.6892344951629639 

Epoch 5, batch 5258
Training loss: 1.6221089363098145 

Epoch 5, batch 5259
Training loss: 2.0304131507873535 

Epoch 5, batch 5260
Training loss: 1.5419222116470337 

Epoch 5, batch 5261
Training loss: 1.5089974403381348 

Epoch 5, batch 5262
Training loss: 1.8035032749176025 

Epoch 5, batch 5263
Training loss: 1.9024218320846558 

Epoch 5, batch 5264
Training loss: 1.76133775711

Epoch 5, batch 5449
Training loss: 1.983227252960205 

Epoch 5, batch 5450
Training loss: 1.5882155895233154 

Epoch 5, batch 5451
Training loss: 1.7245075702667236 

Epoch 5, batch 5452
Training loss: 1.594190239906311 

Epoch 5, batch 5453
Training loss: 1.7188106775283813 

Epoch 5, batch 5454
Training loss: 1.5438586473464966 

Epoch 5, batch 5455
Training loss: 1.6358413696289062 

Epoch 5, batch 5456
Training loss: 1.5702687501907349 

Epoch 5, batch 5457
Training loss: 1.882366418838501 

Epoch 5, batch 5458
Training loss: 1.8635166883468628 

Epoch 5, batch 5459
Training loss: 1.7027400732040405 

Epoch 5, batch 5460
Training loss: 1.7141902446746826 

Epoch 5, batch 5461
Training loss: 1.9064640998840332 

Epoch 5, batch 5462
Training loss: 1.6708924770355225 

Epoch 5, batch 5463
Training loss: 1.862178087234497 

Epoch 5, batch 5464
Training loss: 1.652820110321045 

Epoch 5, batch 5465
Training loss: 1.7534642219543457 

Epoch 5, batch 5466
Training loss: 1.8559218645095825

Epoch 5, batch 5653
Training loss: 1.7329504489898682 

Epoch 5, batch 5654
Training loss: 1.6231054067611694 

Epoch 5, batch 5655
Training loss: 1.7471067905426025 

Epoch 5, batch 5656
Training loss: 1.764328956604004 

Epoch 5, batch 5657
Training loss: 1.6474223136901855 

Epoch 5, batch 5658
Training loss: 1.631348729133606 

Epoch 5, batch 5659
Training loss: 1.6240817308425903 

Epoch 5, batch 5660
Training loss: 1.7836159467697144 

Epoch 5, batch 5661
Training loss: 1.7263703346252441 

Epoch 5, batch 5662
Training loss: 1.5328813791275024 

Epoch 5, batch 5663
Training loss: 1.6566542387008667 

Epoch 5, batch 5664
Training loss: 1.624911904335022 

Epoch 5, batch 5665
Training loss: 1.6581499576568604 

Epoch 5, batch 5666
Training loss: 1.613094449043274 

Epoch 5, batch 5667
Training loss: 1.820212483406067 

Epoch 5, batch 5668
Training loss: 1.6377297639846802 

Epoch 5, batch 5669
Training loss: 1.7127511501312256 

Epoch 5, batch 5670
Training loss: 1.913550615310669 

Epoch 5, batch 5852
Training loss: 1.695288896560669 

Epoch 5, batch 5853
Training loss: 1.6895464658737183 

Epoch 5, batch 5854
Training loss: 1.6193526983261108 

Epoch 5, batch 5855
Training loss: 1.590438723564148 

Epoch 5, batch 5856
Training loss: 1.566845178604126 

Epoch 5, batch 5857
Training loss: 1.58783757686615 

Epoch 5, batch 5858
Training loss: 1.6273128986358643 

Epoch 5, batch 5859
Training loss: 1.7576699256896973 

Epoch 5, batch 5860
Training loss: 1.930857539176941 

Epoch 5, batch 5861
Training loss: 2.0628137588500977 

Epoch 5, batch 5862
Training loss: 1.8046411275863647 

Epoch 5, batch 5863
Training loss: 1.8650248050689697 

Epoch 5, batch 5864
Training loss: 1.9095656871795654 

Epoch 5, batch 5865
Training loss: 1.8791999816894531 

Epoch 5, batch 5866
Training loss: 1.9511175155639648 

Epoch 5, batch 5867
Training loss: 1.8416695594787598 

Epoch 5, batch 5868
Training loss: 1.7680349349975586 

Epoch 5, batch 5869
Training loss: 1.7723255157470703 

Epoch 6, batch 51
Training loss: 1.6191307306289673 

Epoch 6, batch 52
Training loss: 1.9068357944488525 

Epoch 6, batch 53
Training loss: 1.686367392539978 

Epoch 6, batch 54
Training loss: 1.6499180793762207 

Epoch 6, batch 55
Training loss: 1.7677414417266846 

Epoch 6, batch 56
Training loss: 2.02469539642334 

Epoch 6, batch 57
Training loss: 1.9669016599655151 

Epoch 6, batch 58
Training loss: 1.4906384944915771 

Epoch 6, batch 59
Training loss: 1.883618712425232 

Epoch 6, batch 60
Training loss: 1.615978717803955 

Epoch 6, batch 61
Training loss: 1.8220527172088623 

Epoch 6, batch 62
Training loss: 1.4934258460998535 

Epoch 6, batch 63
Training loss: 1.9252451658248901 

Epoch 6, batch 64
Training loss: 1.7272231578826904 

Epoch 6, batch 65
Training loss: 1.9053146839141846 

Epoch 6, batch 66
Training loss: 1.5542833805084229 

Epoch 6, batch 67
Training loss: 1.924564003944397 

Epoch 6, batch 68
Training loss: 1.7042677402496338 

Epoch 6, batch 69
Training loss: 1

Epoch 6, batch 246
Training loss: 1.988820195198059 

Epoch 6, batch 247
Training loss: 1.930835247039795 

Epoch 6, batch 248
Training loss: 1.6006395816802979 

Epoch 6, batch 249
Training loss: 1.7879096269607544 

Epoch 6, batch 250
Training loss: 1.7835015058517456 

Epoch 6, batch 251
Training loss: 1.8166310787200928 

Epoch 6, batch 252
Training loss: 1.7276661396026611 

Epoch 6, batch 253
Training loss: 1.772407054901123 

Epoch 6, batch 254
Training loss: 1.6377720832824707 

Epoch 6, batch 255
Training loss: 1.7899727821350098 

Epoch 6, batch 256
Training loss: 1.6209787130355835 

Epoch 6, batch 257
Training loss: 1.7777718305587769 

Epoch 6, batch 258
Training loss: 1.8919098377227783 

Epoch 6, batch 259
Training loss: 1.6881521940231323 

Epoch 6, batch 260
Training loss: 1.9409843683242798 

Epoch 6, batch 261
Training loss: 1.9524530172348022 

Epoch 6, batch 262
Training loss: 1.6943267583847046 

Epoch 6, batch 263
Training loss: 1.6339561939239502 

Epoch 6, batc

Epoch 6, batch 447
Training loss: 2.0050954818725586 

Epoch 6, batch 448
Training loss: 1.941695213317871 

Epoch 6, batch 449
Training loss: 1.8090720176696777 

Epoch 6, batch 450
Training loss: 1.809375286102295 

Epoch 6, batch 451
Training loss: 1.6083505153656006 

Epoch 6, batch 452
Training loss: 1.6464667320251465 

Epoch 6, batch 453
Training loss: 1.9155771732330322 

Epoch 6, batch 454
Training loss: 1.914501667022705 

Epoch 6, batch 455
Training loss: 1.8333048820495605 

Epoch 6, batch 456
Training loss: 1.7585320472717285 

Epoch 6, batch 457
Training loss: 1.6173193454742432 

Epoch 6, batch 458
Training loss: 1.562957525253296 

Epoch 6, batch 459
Training loss: 1.4671192169189453 

Epoch 6, batch 460
Training loss: 1.575621247291565 

Epoch 6, batch 461
Training loss: 1.5886646509170532 

Epoch 6, batch 462
Training loss: 1.750918984413147 

Epoch 6, batch 463
Training loss: 1.7621508836746216 

Epoch 6, batch 464
Training loss: 1.9931280612945557 

Epoch 6, batch 4

Epoch 6, batch 650
Training loss: 1.7569303512573242 

Epoch 6, batch 651
Training loss: 1.579653263092041 

Epoch 6, batch 652
Training loss: 1.736082673072815 

Epoch 6, batch 653
Training loss: 2.097019672393799 

Epoch 6, batch 654
Training loss: 1.551076054573059 

Epoch 6, batch 655
Training loss: 1.9237720966339111 

Epoch 6, batch 656
Training loss: 1.8384400606155396 

Epoch 6, batch 657
Training loss: 1.747191071510315 

Epoch 6, batch 658
Training loss: 1.5512782335281372 

Epoch 6, batch 659
Training loss: 1.575453281402588 

Epoch 6, batch 660
Training loss: 1.9798271656036377 

Epoch 6, batch 661
Training loss: 1.5069166421890259 

Epoch 6, batch 662
Training loss: 2.0541832447052 

Epoch 6, batch 663
Training loss: 1.722101092338562 

Epoch 6, batch 664
Training loss: 1.8117778301239014 

Epoch 6, batch 665
Training loss: 2.035909652709961 

Epoch 6, batch 666
Training loss: 1.6832585334777832 

Epoch 6, batch 667
Training loss: 1.4848490953445435 

Epoch 6, batch 668
Tr

Epoch 6, batch 851
Training loss: 1.6822361946105957 

Epoch 6, batch 852
Training loss: 1.6195050477981567 

Epoch 6, batch 853
Training loss: 1.8560349941253662 

Epoch 6, batch 854
Training loss: 1.744442105293274 

Epoch 6, batch 855
Training loss: 1.9328360557556152 

Epoch 6, batch 856
Training loss: 1.9666751623153687 

Epoch 6, batch 857
Training loss: 1.6145883798599243 

Epoch 6, batch 858
Training loss: 1.909318208694458 

Epoch 6, batch 859
Training loss: 1.8267121315002441 

Epoch 6, batch 860
Training loss: 1.9410159587860107 

Epoch 6, batch 861
Training loss: 1.7316739559173584 

Epoch 6, batch 862
Training loss: 1.5995595455169678 

Epoch 6, batch 863
Training loss: 1.7156758308410645 

Epoch 6, batch 864
Training loss: 1.6958975791931152 

Epoch 6, batch 865
Training loss: 1.6963162422180176 

Epoch 6, batch 866
Training loss: 1.7895185947418213 

Epoch 6, batch 867
Training loss: 1.6207499504089355 

Epoch 6, batch 868
Training loss: 1.9024407863616943 

Epoch 6, bat

Epoch 6, batch 1049
Training loss: 1.7704124450683594 

Epoch 6, batch 1050
Training loss: 1.9032044410705566 

Epoch 6, batch 1051
Training loss: 1.8512386083602905 

Epoch 6, batch 1052
Training loss: 1.9201090335845947 

Epoch 6, batch 1053
Training loss: 1.5080416202545166 

Epoch 6, batch 1054
Training loss: 1.6128215789794922 

Epoch 6, batch 1055
Training loss: 1.6770942211151123 

Epoch 6, batch 1056
Training loss: 1.6181199550628662 

Epoch 6, batch 1057
Training loss: 1.5318242311477661 

Epoch 6, batch 1058
Training loss: 1.7828738689422607 

Epoch 6, batch 1059
Training loss: 1.7676801681518555 

Epoch 6, batch 1060
Training loss: 1.9364290237426758 

Epoch 6, batch 1061
Training loss: 1.862245798110962 

Epoch 6, batch 1062
Training loss: 1.9096852540969849 

Epoch 6, batch 1063
Training loss: 1.8023678064346313 

Epoch 6, batch 1064
Training loss: 1.910603404045105 

Epoch 6, batch 1065
Training loss: 1.7156118154525757 

Epoch 6, batch 1066
Training loss: 1.7284637689590

Epoch 6, batch 1252
Training loss: 1.9651800394058228 

Epoch 6, batch 1253
Training loss: 1.9803911447525024 

Epoch 6, batch 1254
Training loss: 1.6333630084991455 

Epoch 6, batch 1255
Training loss: 1.7410681247711182 

Epoch 6, batch 1256
Training loss: 1.8995623588562012 

Epoch 6, batch 1257
Training loss: 1.5095638036727905 

Epoch 6, batch 1258
Training loss: 1.8652409315109253 

Epoch 6, batch 1259
Training loss: 1.7285875082015991 

Epoch 6, batch 1260
Training loss: 1.600203275680542 

Epoch 6, batch 1261
Training loss: 1.6924580335617065 

Epoch 6, batch 1262
Training loss: 1.8849314451217651 

Epoch 6, batch 1263
Training loss: 1.7428624629974365 

Epoch 6, batch 1264
Training loss: 1.6680099964141846 

Epoch 6, batch 1265
Training loss: 1.83501136302948 

Epoch 6, batch 1266
Training loss: 1.584660530090332 

Epoch 6, batch 1267
Training loss: 1.8779703378677368 

Epoch 6, batch 1268
Training loss: 1.9979788064956665 

Epoch 6, batch 1269
Training loss: 1.529326200485229

Epoch 6, batch 1452
Training loss: 1.533927083015442 

Epoch 6, batch 1453
Training loss: 1.7753393650054932 

Epoch 6, batch 1454
Training loss: 1.4989980459213257 

Epoch 6, batch 1455
Training loss: 1.706847906112671 

Epoch 6, batch 1456
Training loss: 1.6844297647476196 

Epoch 6, batch 1457
Training loss: 1.757906436920166 

Epoch 6, batch 1458
Training loss: 1.8284170627593994 

Epoch 6, batch 1459
Training loss: 1.873357892036438 

Epoch 6, batch 1460
Training loss: 1.731221079826355 

Epoch 6, batch 1461
Training loss: 1.6487412452697754 

Epoch 6, batch 1462
Training loss: 1.803039789199829 

Epoch 6, batch 1463
Training loss: 1.5641295909881592 

Epoch 6, batch 1464
Training loss: 2.007436513900757 

Epoch 6, batch 1465
Training loss: 1.5781391859054565 

Epoch 6, batch 1466
Training loss: 1.7784181833267212 

Epoch 6, batch 1467
Training loss: 1.900970220565796 

Epoch 6, batch 1468
Training loss: 1.848329782485962 

Epoch 6, batch 1469
Training loss: 1.888607144355774 

Ep

Epoch 6, batch 1651
Training loss: 1.6753844022750854 

Epoch 6, batch 1652
Training loss: 1.7161784172058105 

Epoch 6, batch 1653
Training loss: 1.8999090194702148 

Epoch 6, batch 1654
Training loss: 1.917931079864502 

Epoch 6, batch 1655
Training loss: 1.9008095264434814 

Epoch 6, batch 1656
Training loss: 1.7474945783615112 

Epoch 6, batch 1657
Training loss: 1.7665233612060547 

Epoch 6, batch 1658
Training loss: 1.8599456548690796 

Epoch 6, batch 1659
Training loss: 1.5009267330169678 

Epoch 6, batch 1660
Training loss: 1.757054328918457 

Epoch 6, batch 1661
Training loss: 1.7123929262161255 

Epoch 6, batch 1662
Training loss: 1.5929994583129883 

Epoch 6, batch 1663
Training loss: 1.9321506023406982 

Epoch 6, batch 1664
Training loss: 1.9362422227859497 

Epoch 6, batch 1665
Training loss: 1.6834216117858887 

Epoch 6, batch 1666
Training loss: 1.6069153547286987 

Epoch 6, batch 1667
Training loss: 1.6102044582366943 

Epoch 6, batch 1668
Training loss: 1.9356160163879

Epoch 6, batch 1852
Training loss: 1.7879455089569092 

Epoch 6, batch 1853
Training loss: 1.7493455410003662 

Epoch 6, batch 1854
Training loss: 1.7827188968658447 

Epoch 6, batch 1855
Training loss: 1.504034399986267 

Epoch 6, batch 1856
Training loss: 1.8230791091918945 

Epoch 6, batch 1857
Training loss: 1.6293919086456299 

Epoch 6, batch 1858
Training loss: 1.4903533458709717 

Epoch 6, batch 1859
Training loss: 1.6160961389541626 

Epoch 6, batch 1860
Training loss: 1.7822723388671875 

Epoch 6, batch 1861
Training loss: 1.6746493577957153 

Epoch 6, batch 1862
Training loss: 1.7318612337112427 

Epoch 6, batch 1863
Training loss: 1.7794599533081055 

Epoch 6, batch 1864
Training loss: 1.550907850265503 

Epoch 6, batch 1865
Training loss: 1.6996549367904663 

Epoch 6, batch 1866
Training loss: 1.7897987365722656 

Epoch 6, batch 1867
Training loss: 2.043928384780884 

Epoch 6, batch 1868
Training loss: 1.8055806159973145 

Epoch 6, batch 1869
Training loss: 1.74413704872131

Epoch 6, batch 2053
Training loss: 1.9533586502075195 

Epoch 6, batch 2054
Training loss: 1.808634638786316 

Epoch 6, batch 2055
Training loss: 1.563166856765747 

Epoch 6, batch 2056
Training loss: 2.056333065032959 

Epoch 6, batch 2057
Training loss: 1.6818630695343018 

Epoch 6, batch 2058
Training loss: 1.7811942100524902 

Epoch 6, batch 2059
Training loss: 1.849542260169983 

Epoch 6, batch 2060
Training loss: 2.0512354373931885 

Epoch 6, batch 2061
Training loss: 1.4677814245224 

Epoch 6, batch 2062
Training loss: 2.048475980758667 

Epoch 6, batch 2063
Training loss: 1.7336688041687012 

Epoch 6, batch 2064
Training loss: 1.7399048805236816 

Epoch 6, batch 2065
Training loss: 1.4783697128295898 

Epoch 6, batch 2066
Training loss: 1.7563709020614624 

Epoch 6, batch 2067
Training loss: 1.5132336616516113 

Epoch 6, batch 2068
Training loss: 1.6710872650146484 

Epoch 6, batch 2069
Training loss: 1.6523349285125732 

Epoch 6, batch 2070
Training loss: 1.8790538311004639 



Epoch 6, batch 2256
Training loss: 1.8255805969238281 

Epoch 6, batch 2257
Training loss: 1.4804706573486328 

Epoch 6, batch 2258
Training loss: 1.887759804725647 

Epoch 6, batch 2259
Training loss: 1.8205746412277222 

Epoch 6, batch 2260
Training loss: 1.5833079814910889 

Epoch 6, batch 2261
Training loss: 1.7934659719467163 

Epoch 6, batch 2262
Training loss: 1.742742896080017 

Epoch 6, batch 2263
Training loss: 1.8307546377182007 

Epoch 6, batch 2264
Training loss: 1.5939342975616455 

Epoch 6, batch 2265
Training loss: 1.7274411916732788 

Epoch 6, batch 2266
Training loss: 1.8009697198867798 

Epoch 6, batch 2267
Training loss: 1.9902263879776 

Epoch 6, batch 2268
Training loss: 1.592024803161621 

Epoch 6, batch 2269
Training loss: 1.6257573366165161 

Epoch 6, batch 2270
Training loss: 1.8251128196716309 

Epoch 6, batch 2271
Training loss: 1.8926477432250977 

Epoch 6, batch 2272
Training loss: 1.5805385112762451 

Epoch 6, batch 2273
Training loss: 1.746565341949463 


Epoch 6, batch 2454
Training loss: 1.5066882371902466 

Epoch 6, batch 2455
Training loss: 1.7104763984680176 

Epoch 6, batch 2456
Training loss: 1.8645368814468384 

Epoch 6, batch 2457
Training loss: 1.8604819774627686 

Epoch 6, batch 2458
Training loss: 1.7235627174377441 

Epoch 6, batch 2459
Training loss: 1.7773103713989258 

Epoch 6, batch 2460
Training loss: 1.8388376235961914 

Epoch 6, batch 2461
Training loss: 1.696733832359314 

Epoch 6, batch 2462
Training loss: 1.7898029088974 

Epoch 6, batch 2463
Training loss: 1.8536814451217651 

Epoch 6, batch 2464
Training loss: 1.495309829711914 

Epoch 6, batch 2465
Training loss: 1.96514892578125 

Epoch 6, batch 2466
Training loss: 1.7802457809448242 

Epoch 6, batch 2467
Training loss: 1.7598652839660645 

Epoch 6, batch 2468
Training loss: 1.927101492881775 

Epoch 6, batch 2469
Training loss: 1.7281816005706787 

Epoch 6, batch 2470
Training loss: 1.6633751392364502 

Epoch 6, batch 2471
Training loss: 2.056342840194702 

E

Epoch 6, batch 2656
Training loss: 1.724291205406189 

Epoch 6, batch 2657
Training loss: 1.7077388763427734 

Epoch 6, batch 2658
Training loss: 2.0333409309387207 

Epoch 6, batch 2659
Training loss: 1.8855454921722412 

Epoch 6, batch 2660
Training loss: 1.6575076580047607 

Epoch 6, batch 2661
Training loss: 1.6107263565063477 

Epoch 6, batch 2662
Training loss: 1.8249611854553223 

Epoch 6, batch 2663
Training loss: 1.7281672954559326 

Epoch 6, batch 2664
Training loss: 1.8030240535736084 

Epoch 6, batch 2665
Training loss: 1.8222455978393555 

Epoch 6, batch 2666
Training loss: 1.654012680053711 

Epoch 6, batch 2667
Training loss: 1.9189538955688477 

Epoch 6, batch 2668
Training loss: 1.7061667442321777 

Epoch 6, batch 2669
Training loss: 1.6773295402526855 

Epoch 6, batch 2670
Training loss: 1.9323184490203857 

Epoch 6, batch 2671
Training loss: 1.6905328035354614 

Epoch 6, batch 2672
Training loss: 1.7168009281158447 

Epoch 6, batch 2673
Training loss: 1.6161731481552

Epoch 6, batch 2855
Training loss: 1.6948120594024658 

Epoch 6, batch 2856
Training loss: 1.6833574771881104 

Epoch 6, batch 2857
Training loss: 1.9060649871826172 

Epoch 6, batch 2858
Training loss: 1.8821017742156982 

Epoch 6, batch 2859
Training loss: 1.8075404167175293 

Epoch 6, batch 2860
Training loss: 1.7271716594696045 

Epoch 6, batch 2861
Training loss: 1.7612252235412598 

Epoch 6, batch 2862
Training loss: 1.8516252040863037 

Epoch 6, batch 2863
Training loss: 1.6750733852386475 

Epoch 6, batch 2864
Training loss: 1.629998803138733 

Epoch 6, batch 2865
Training loss: 1.7226762771606445 

Epoch 6, batch 2866
Training loss: 1.7866154909133911 

Epoch 6, batch 2867
Training loss: 1.582991361618042 

Epoch 6, batch 2868
Training loss: 1.5888200998306274 

Epoch 6, batch 2869
Training loss: 1.6586214303970337 

Epoch 6, batch 2870
Training loss: 1.9598629474639893 

Epoch 6, batch 2871
Training loss: 1.84246027469635 

Epoch 6, batch 2872
Training loss: 1.660714864730835

Epoch 6, batch 3054
Training loss: 1.6637738943099976 

Epoch 6, batch 3055
Training loss: 1.5238579511642456 

Epoch 6, batch 3056
Training loss: 1.5866503715515137 

Epoch 6, batch 3057
Training loss: 1.5811469554901123 

Epoch 6, batch 3058
Training loss: 2.0111193656921387 

Epoch 6, batch 3059
Training loss: 1.6126441955566406 

Epoch 6, batch 3060
Training loss: 1.9304927587509155 

Epoch 6, batch 3061
Training loss: 1.6486763954162598 

Epoch 6, batch 3062
Training loss: 1.7287380695343018 

Epoch 6, batch 3063
Training loss: 1.4620503187179565 

Epoch 6, batch 3064
Training loss: 1.8970621824264526 

Epoch 6, batch 3065
Training loss: 1.654127597808838 

Epoch 6, batch 3066
Training loss: 1.6998651027679443 

Epoch 6, batch 3067
Training loss: 1.6013903617858887 

Epoch 6, batch 3068
Training loss: 1.4631911516189575 

Epoch 6, batch 3069
Training loss: 1.5197932720184326 

Epoch 6, batch 3070
Training loss: 1.8636276721954346 

Epoch 6, batch 3071
Training loss: 1.625230789184

Epoch 6, batch 3250
Training loss: 1.719076156616211 

Epoch 6, batch 3251
Training loss: 1.9361075162887573 

Epoch 6, batch 3252
Training loss: 1.570584774017334 

Epoch 6, batch 3253
Training loss: 1.8840903043746948 

Epoch 6, batch 3254
Training loss: 1.727912187576294 

Epoch 6, batch 3255
Training loss: 1.6635830402374268 

Epoch 6, batch 3256
Training loss: 1.7200508117675781 

Epoch 6, batch 3257
Training loss: 1.8546390533447266 

Epoch 6, batch 3258
Training loss: 1.7682600021362305 

Epoch 6, batch 3259
Training loss: 1.9093284606933594 

Epoch 6, batch 3260
Training loss: 1.6484450101852417 

Epoch 6, batch 3261
Training loss: 1.6758649349212646 

Epoch 6, batch 3262
Training loss: 1.899287223815918 

Epoch 6, batch 3263
Training loss: 1.994558572769165 

Epoch 6, batch 3264
Training loss: 1.4814891815185547 

Epoch 6, batch 3265
Training loss: 1.541655421257019 

Epoch 6, batch 3266
Training loss: 1.6131659746170044 

Epoch 6, batch 3267
Training loss: 1.5466294288635254 

Epoch 6, batch 3453
Training loss: 1.6138873100280762 

Epoch 6, batch 3454
Training loss: 1.847386360168457 

Epoch 6, batch 3455
Training loss: 1.5701924562454224 

Epoch 6, batch 3456
Training loss: 1.872585415840149 

Epoch 6, batch 3457
Training loss: 1.5474823713302612 

Epoch 6, batch 3458
Training loss: 1.6536626815795898 

Epoch 6, batch 3459
Training loss: 1.931786060333252 

Epoch 6, batch 3460
Training loss: 1.7114291191101074 

Epoch 6, batch 3461
Training loss: 1.8881195783615112 

Epoch 6, batch 3462
Training loss: 1.8268451690673828 

Epoch 6, batch 3463
Training loss: 1.874561071395874 

Epoch 6, batch 3464
Training loss: 2.010136842727661 

Epoch 6, batch 3465
Training loss: 1.779513955116272 

Epoch 6, batch 3466
Training loss: 1.8744421005249023 

Epoch 6, batch 3467
Training loss: 1.5727436542510986 

Epoch 6, batch 3468
Training loss: 1.687353253364563 

Epoch 6, batch 3469
Training loss: 1.8321607112884521 

Epoch 6, batch 3470
Training loss: 1.7050024271011353 


Epoch 6, batch 3654
Training loss: 1.4721012115478516 

Epoch 6, batch 3655
Training loss: 1.9250624179840088 

Epoch 6, batch 3656
Training loss: 1.8041293621063232 

Epoch 6, batch 3657
Training loss: 1.5583865642547607 

Epoch 6, batch 3658
Training loss: 1.9799222946166992 

Epoch 6, batch 3659
Training loss: 1.7225730419158936 

Epoch 6, batch 3660
Training loss: 1.9259178638458252 

Epoch 6, batch 3661
Training loss: 1.8074302673339844 

Epoch 6, batch 3662
Training loss: 1.746986746788025 

Epoch 6, batch 3663
Training loss: 1.8555243015289307 

Epoch 6, batch 3664
Training loss: 1.4976489543914795 

Epoch 6, batch 3665
Training loss: 1.6378655433654785 

Epoch 6, batch 3666
Training loss: 1.7351216077804565 

Epoch 6, batch 3667
Training loss: 1.9997096061706543 

Epoch 6, batch 3668
Training loss: 1.7643332481384277 

Epoch 6, batch 3669
Training loss: 1.5290606021881104 

Epoch 6, batch 3670
Training loss: 1.8348307609558105 

Epoch 6, batch 3671
Training loss: 1.857283830642

Epoch 6, batch 3851
Training loss: 1.661120057106018 

Epoch 6, batch 3852
Training loss: 1.6559563875198364 

Epoch 6, batch 3853
Training loss: 1.8846957683563232 

Epoch 6, batch 3854
Training loss: 1.782464623451233 

Epoch 6, batch 3855
Training loss: 1.73622727394104 

Epoch 6, batch 3856
Training loss: 1.8044580221176147 

Epoch 6, batch 3857
Training loss: 1.8593535423278809 

Epoch 6, batch 3858
Training loss: 1.5463433265686035 

Epoch 6, batch 3859
Training loss: 1.9534988403320312 

Epoch 6, batch 3860
Training loss: 1.6891882419586182 

Epoch 6, batch 3861
Training loss: 1.5340907573699951 

Epoch 6, batch 3862
Training loss: 1.783158779144287 

Epoch 6, batch 3863
Training loss: 1.8629040718078613 

Epoch 6, batch 3864
Training loss: 2.049069404602051 

Epoch 6, batch 3865
Training loss: 1.689555287361145 

Epoch 6, batch 3866
Training loss: 2.0007483959198 

Epoch 6, batch 3867
Training loss: 1.6272897720336914 

Epoch 6, batch 3868
Training loss: 1.6309754848480225 

Ep

Epoch 6, batch 4052
Training loss: 1.8408420085906982 

Epoch 6, batch 4053
Training loss: 1.869314432144165 

Epoch 6, batch 4054
Training loss: 1.710912823677063 

Epoch 6, batch 4055
Training loss: 1.643086552619934 

Epoch 6, batch 4056
Training loss: 1.6042864322662354 

Epoch 6, batch 4057
Training loss: 1.7993415594100952 

Epoch 6, batch 4058
Training loss: 1.921836018562317 

Epoch 6, batch 4059
Training loss: 1.6573936939239502 

Epoch 6, batch 4060
Training loss: 1.9928542375564575 

Epoch 6, batch 4061
Training loss: 1.8351434469223022 

Epoch 6, batch 4062
Training loss: 1.5900808572769165 

Epoch 6, batch 4063
Training loss: 1.7906906604766846 

Epoch 6, batch 4064
Training loss: 1.591221809387207 

Epoch 6, batch 4065
Training loss: 1.7523988485336304 

Epoch 6, batch 4066
Training loss: 1.7277910709381104 

Epoch 6, batch 4067
Training loss: 2.0187885761260986 

Epoch 6, batch 4068
Training loss: 1.994422435760498 

Epoch 6, batch 4069
Training loss: 1.7407402992248535 

Epoch 6, batch 4255
Training loss: 2.1117703914642334 

Epoch 6, batch 4256
Training loss: 1.6273934841156006 

Epoch 6, batch 4257
Training loss: 1.5946414470672607 

Epoch 6, batch 4258
Training loss: 1.6914098262786865 

Epoch 6, batch 4259
Training loss: 1.6031144857406616 

Epoch 6, batch 4260
Training loss: 1.5653588771820068 

Epoch 6, batch 4261
Training loss: 1.6846365928649902 

Epoch 6, batch 4262
Training loss: 1.8608574867248535 

Epoch 6, batch 4263
Training loss: 1.682633399963379 

Epoch 6, batch 4264
Training loss: 1.794681191444397 

Epoch 6, batch 4265
Training loss: 1.6330945491790771 

Epoch 6, batch 4266
Training loss: 1.9604804515838623 

Epoch 6, batch 4267
Training loss: 1.600452184677124 

Epoch 6, batch 4268
Training loss: 1.7967966794967651 

Epoch 6, batch 4269
Training loss: 1.4881970882415771 

Epoch 6, batch 4270
Training loss: 1.9090843200683594 

Epoch 6, batch 4271
Training loss: 1.6985650062561035 

Epoch 6, batch 4272
Training loss: 1.68097305297851

Epoch 6, batch 4458
Training loss: 1.813518762588501 

Epoch 6, batch 4459
Training loss: 1.5951961278915405 

Epoch 6, batch 4460
Training loss: 1.7643948793411255 

Epoch 6, batch 4461
Training loss: 1.9969146251678467 

Epoch 6, batch 4462
Training loss: 1.9262176752090454 

Epoch 6, batch 4463
Training loss: 1.6282621622085571 

Epoch 6, batch 4464
Training loss: 1.624765396118164 

Epoch 6, batch 4465
Training loss: 1.6831786632537842 

Epoch 6, batch 4466
Training loss: 1.9529197216033936 

Epoch 6, batch 4467
Training loss: 1.5685502290725708 

Epoch 6, batch 4468
Training loss: 1.698035717010498 

Epoch 6, batch 4469
Training loss: 1.6924195289611816 

Epoch 6, batch 4470
Training loss: 1.7424287796020508 

Epoch 6, batch 4471
Training loss: 1.6526894569396973 

Epoch 6, batch 4472
Training loss: 1.7606315612792969 

Epoch 6, batch 4473
Training loss: 1.9108625650405884 

Epoch 6, batch 4474
Training loss: 1.575362205505371 

Epoch 6, batch 4475
Training loss: 1.821843862533569

Epoch 6, batch 4655
Training loss: 1.5899406671524048 

Epoch 6, batch 4656
Training loss: 1.6596753597259521 

Epoch 6, batch 4657
Training loss: 1.5372023582458496 

Epoch 6, batch 4658
Training loss: 1.6611250638961792 

Epoch 6, batch 4659
Training loss: 1.5598936080932617 

Epoch 6, batch 4660
Training loss: 1.5172849893569946 

Epoch 6, batch 4661
Training loss: 1.8674042224884033 

Epoch 6, batch 4662
Training loss: 1.643062710762024 

Epoch 6, batch 4663
Training loss: 1.5047802925109863 

Epoch 6, batch 4664
Training loss: 1.7983956336975098 

Epoch 6, batch 4665
Training loss: 1.8501181602478027 

Epoch 6, batch 4666
Training loss: 1.862499713897705 

Epoch 6, batch 4667
Training loss: 1.770300030708313 

Epoch 6, batch 4668
Training loss: 1.7222570180892944 

Epoch 6, batch 4669
Training loss: 1.6094486713409424 

Epoch 6, batch 4670
Training loss: 1.7165021896362305 

Epoch 6, batch 4671
Training loss: 1.6663652658462524 

Epoch 6, batch 4672
Training loss: 1.51912188529968

Epoch 6, batch 4858
Training loss: 1.6145057678222656 

Epoch 6, batch 4859
Training loss: 1.829484462738037 

Epoch 6, batch 4860
Training loss: 1.5515459775924683 

Epoch 6, batch 4861
Training loss: 1.7824718952178955 

Epoch 6, batch 4862
Training loss: 1.607067584991455 

Epoch 6, batch 4863
Training loss: 1.862002968788147 

Epoch 6, batch 4864
Training loss: 1.469422698020935 

Epoch 6, batch 4865
Training loss: 1.8719265460968018 

Epoch 6, batch 4866
Training loss: 1.7951843738555908 

Epoch 6, batch 4867
Training loss: 1.6852372884750366 

Epoch 6, batch 4868
Training loss: 1.5319321155548096 

Epoch 6, batch 4869
Training loss: 1.6934802532196045 

Epoch 6, batch 4870
Training loss: 1.7135298252105713 

Epoch 6, batch 4871
Training loss: 1.8295676708221436 

Epoch 6, batch 4872
Training loss: 1.8439793586730957 

Epoch 6, batch 4873
Training loss: 1.8506805896759033 

Epoch 6, batch 4874
Training loss: 1.978467345237732 

Epoch 6, batch 4875
Training loss: 1.7634527683258057

Epoch 6, batch 5059
Training loss: 1.9194231033325195 

Epoch 6, batch 5060
Training loss: 1.8928329944610596 

Epoch 6, batch 5061
Training loss: 1.507132887840271 

Epoch 6, batch 5062
Training loss: 1.772212266921997 

Epoch 6, batch 5063
Training loss: 1.6929560899734497 

Epoch 6, batch 5064
Training loss: 1.6276915073394775 

Epoch 6, batch 5065
Training loss: 1.663963794708252 

Epoch 6, batch 5066
Training loss: 1.8447116613388062 

Epoch 6, batch 5067
Training loss: 1.9685665369033813 

Epoch 6, batch 5068
Training loss: 1.8756095170974731 

Epoch 6, batch 5069
Training loss: 1.9031660556793213 

Epoch 6, batch 5070
Training loss: 1.8425767421722412 

Epoch 6, batch 5071
Training loss: 1.6671838760375977 

Epoch 6, batch 5072
Training loss: 1.959942102432251 

Epoch 6, batch 5073
Training loss: 1.579688310623169 

Epoch 6, batch 5074
Training loss: 1.880575180053711 

Epoch 6, batch 5075
Training loss: 1.7995173931121826 

Epoch 6, batch 5076
Training loss: 1.806862235069275 


Epoch 6, batch 5258
Training loss: 1.5917695760726929 

Epoch 6, batch 5259
Training loss: 2.0367746353149414 

Epoch 6, batch 5260
Training loss: 1.6126667261123657 

Epoch 6, batch 5261
Training loss: 1.6031246185302734 

Epoch 6, batch 5262
Training loss: 1.654548168182373 

Epoch 6, batch 5263
Training loss: 1.9051233530044556 

Epoch 6, batch 5264
Training loss: 1.6285845041275024 

Epoch 6, batch 5265
Training loss: 1.980395793914795 

Epoch 6, batch 5266
Training loss: 1.8782896995544434 

Epoch 6, batch 5267
Training loss: 1.851393461227417 

Epoch 6, batch 5268
Training loss: 1.6760656833648682 

Epoch 6, batch 5269
Training loss: 1.6299484968185425 

Epoch 6, batch 5270
Training loss: 1.8553491830825806 

Epoch 6, batch 5271
Training loss: 1.5930261611938477 

Epoch 6, batch 5272
Training loss: 1.8275563716888428 

Epoch 6, batch 5273
Training loss: 1.7156492471694946 

Epoch 6, batch 5274
Training loss: 1.7704942226409912 

Epoch 6, batch 5275
Training loss: 1.64998137950897

Epoch 6, batch 5458
Training loss: 1.5027923583984375 

Epoch 6, batch 5459
Training loss: 1.738031268119812 

Epoch 6, batch 5460
Training loss: 1.6132574081420898 

Epoch 6, batch 5461
Training loss: 1.7885504961013794 

Epoch 6, batch 5462
Training loss: 1.7139809131622314 

Epoch 6, batch 5463
Training loss: 1.5402195453643799 

Epoch 6, batch 5464
Training loss: 1.96405029296875 

Epoch 6, batch 5465
Training loss: 1.6490317583084106 

Epoch 6, batch 5466
Training loss: 1.6145439147949219 

Epoch 6, batch 5467
Training loss: 1.9936190843582153 

Epoch 6, batch 5468
Training loss: 1.8036260604858398 

Epoch 6, batch 5469
Training loss: 1.5072120428085327 

Epoch 6, batch 5470
Training loss: 1.6548279523849487 

Epoch 6, batch 5471
Training loss: 1.9062013626098633 

Epoch 6, batch 5472
Training loss: 1.638838768005371 

Epoch 6, batch 5473
Training loss: 1.6638728380203247 

Epoch 6, batch 5474
Training loss: 1.8932950496673584 

Epoch 6, batch 5475
Training loss: 1.739733457565307

Epoch 6, batch 5657
Training loss: 1.8815912008285522 

Epoch 6, batch 5658
Training loss: 1.7164864540100098 

Epoch 6, batch 5659
Training loss: 1.8818459510803223 

Epoch 6, batch 5660
Training loss: 1.96744966506958 

Epoch 6, batch 5661
Training loss: 2.0285069942474365 

Epoch 6, batch 5662
Training loss: 1.6212000846862793 

Epoch 6, batch 5663
Training loss: 1.6296887397766113 

Epoch 6, batch 5664
Training loss: 1.5769857168197632 

Epoch 6, batch 5665
Training loss: 1.541986107826233 

Epoch 6, batch 5666
Training loss: 1.839996337890625 

Epoch 6, batch 5667
Training loss: 1.5948749780654907 

Epoch 6, batch 5668
Training loss: 1.988131046295166 

Epoch 6, batch 5669
Training loss: 1.7423198223114014 

Epoch 6, batch 5670
Training loss: 2.0499155521392822 

Epoch 6, batch 5671
Training loss: 1.7701163291931152 

Epoch 6, batch 5672
Training loss: 1.9012556076049805 

Epoch 6, batch 5673
Training loss: 1.7706904411315918 

Epoch 6, batch 5674
Training loss: 1.951479196548462 

Epoch 6, batch 5848
Training loss: 1.6947834491729736 

Epoch 6, batch 5849
Training loss: 1.7457462549209595 

Epoch 6, batch 5850
Training loss: 1.9441068172454834 

Epoch 6, batch 5851
Training loss: 1.5957733392715454 

Epoch 6, batch 5852
Training loss: 1.8319514989852905 

Epoch 6, batch 5853
Training loss: 1.554473638534546 

Epoch 6, batch 5854
Training loss: 1.6447917222976685 

Epoch 6, batch 5855
Training loss: 1.9304802417755127 

Epoch 6, batch 5856
Training loss: 1.8149045705795288 

Epoch 6, batch 5857
Training loss: 1.6522622108459473 

Epoch 6, batch 5858
Training loss: 1.6270556449890137 

Epoch 6, batch 5859
Training loss: 1.9099042415618896 

Epoch 6, batch 5860
Training loss: 1.813340425491333 

Epoch 6, batch 5861
Training loss: 1.9050016403198242 

Epoch 6, batch 5862
Training loss: 1.6202139854431152 

Epoch 6, batch 5863
Training loss: 1.6044915914535522 

Epoch 6, batch 5864
Training loss: 1.937110424041748 

Epoch 6, batch 5865
Training loss: 1.63637721538543

Epoch 7, batch 35
Training loss: 1.651577353477478 

Epoch 7, batch 36
Training loss: 1.6038823127746582 

Epoch 7, batch 37
Training loss: 1.7165396213531494 

Epoch 7, batch 38
Training loss: 1.5651347637176514 

Epoch 7, batch 39
Training loss: 1.7615675926208496 

Epoch 7, batch 40
Training loss: 1.5897451639175415 

Epoch 7, batch 41
Training loss: 1.7934905290603638 

Epoch 7, batch 42
Training loss: 1.8356153964996338 

Epoch 7, batch 43
Training loss: 1.645133137702942 

Epoch 7, batch 44
Training loss: 1.7094285488128662 

Epoch 7, batch 45
Training loss: 1.6233817338943481 

Epoch 7, batch 46
Training loss: 1.5668694972991943 

Epoch 7, batch 47
Training loss: 1.8336163759231567 

Epoch 7, batch 48
Training loss: 1.5107471942901611 

Epoch 7, batch 49
Training loss: 1.8616524934768677 

Epoch 7, batch 50
Training loss: 1.8032371997833252 

Epoch 7, batch 51
Training loss: 1.9116674661636353 

Epoch 7, batch 52
Training loss: 1.6163033246994019 

Epoch 7, batch 53
Training los

Epoch 7, batch 238
Training loss: 1.6738642454147339 

Epoch 7, batch 239
Training loss: 1.6750684976577759 

Epoch 7, batch 240
Training loss: 1.6989781856536865 

Epoch 7, batch 241
Training loss: 1.52738618850708 

Epoch 7, batch 242
Training loss: 1.5658470392227173 

Epoch 7, batch 243
Training loss: 1.6305533647537231 

Epoch 7, batch 244
Training loss: 1.55489182472229 

Epoch 7, batch 245
Training loss: 1.5216941833496094 

Epoch 7, batch 246
Training loss: 1.998661994934082 

Epoch 7, batch 247
Training loss: 1.574539303779602 

Epoch 7, batch 248
Training loss: 1.5162296295166016 

Epoch 7, batch 249
Training loss: 1.890338659286499 

Epoch 7, batch 250
Training loss: 2.029674530029297 

Epoch 7, batch 251
Training loss: 1.8384673595428467 

Epoch 7, batch 252
Training loss: 1.7300140857696533 

Epoch 7, batch 253
Training loss: 1.6446588039398193 

Epoch 7, batch 254
Training loss: 1.6966907978057861 

Epoch 7, batch 255
Training loss: 1.7015495300292969 

Epoch 7, batch 256

Epoch 7, batch 439
Training loss: 1.7259553670883179 

Epoch 7, batch 440
Training loss: 1.9151558876037598 

Epoch 7, batch 441
Training loss: 1.7392436265945435 

Epoch 7, batch 442
Training loss: 1.6211819648742676 

Epoch 7, batch 443
Training loss: 1.887158751487732 

Epoch 7, batch 444
Training loss: 1.6698861122131348 

Epoch 7, batch 445
Training loss: 1.9180793762207031 

Epoch 7, batch 446
Training loss: 1.7513930797576904 

Epoch 7, batch 447
Training loss: 1.7816247940063477 

Epoch 7, batch 448
Training loss: 1.83524751663208 

Epoch 7, batch 449
Training loss: 1.8734618425369263 

Epoch 7, batch 450
Training loss: 1.59931218624115 

Epoch 7, batch 451
Training loss: 1.596150517463684 

Epoch 7, batch 452
Training loss: 1.5052638053894043 

Epoch 7, batch 453
Training loss: 1.8128454685211182 

Epoch 7, batch 454
Training loss: 1.8349957466125488 

Epoch 7, batch 455
Training loss: 1.6111764907836914 

Epoch 7, batch 456
Training loss: 1.603666067123413 

Epoch 7, batch 45

Epoch 7, batch 640
Training loss: 2.0660159587860107 

Epoch 7, batch 641
Training loss: 1.4858837127685547 

Epoch 7, batch 642
Training loss: 1.6343026161193848 

Epoch 7, batch 643
Training loss: 1.8447778224945068 

Epoch 7, batch 644
Training loss: 1.837372064590454 

Epoch 7, batch 645
Training loss: 1.6992493867874146 

Epoch 7, batch 646
Training loss: 1.6154885292053223 

Epoch 7, batch 647
Training loss: 1.7195782661437988 

Epoch 7, batch 648
Training loss: 1.8430979251861572 

Epoch 7, batch 649
Training loss: 1.8639333248138428 

Epoch 7, batch 650
Training loss: 1.6670429706573486 

Epoch 7, batch 651
Training loss: 1.5546401739120483 

Epoch 7, batch 652
Training loss: 1.8575433492660522 

Epoch 7, batch 653
Training loss: 1.672019600868225 

Epoch 7, batch 654
Training loss: 1.8196159601211548 

Epoch 7, batch 655
Training loss: 1.8442270755767822 

Epoch 7, batch 656
Training loss: 1.9751458168029785 

Epoch 7, batch 657
Training loss: 1.6424331665039062 

Epoch 7, bat

Epoch 7, batch 838
Training loss: 1.5663912296295166 

Epoch 7, batch 839
Training loss: 1.574475646018982 

Epoch 7, batch 840
Training loss: 1.7440215349197388 

Epoch 7, batch 841
Training loss: 1.732362985610962 

Epoch 7, batch 842
Training loss: 1.9204277992248535 

Epoch 7, batch 843
Training loss: 1.521646499633789 

Epoch 7, batch 844
Training loss: 1.6097698211669922 

Epoch 7, batch 845
Training loss: 1.979684591293335 

Epoch 7, batch 846
Training loss: 1.5413740873336792 

Epoch 7, batch 847
Training loss: 1.856827974319458 

Epoch 7, batch 848
Training loss: 1.6067731380462646 

Epoch 7, batch 849
Training loss: 1.6848320960998535 

Epoch 7, batch 850
Training loss: 1.7790578603744507 

Epoch 7, batch 851
Training loss: 2.0025341510772705 

Epoch 7, batch 852
Training loss: 1.7492387294769287 

Epoch 7, batch 853
Training loss: 1.7348277568817139 

Epoch 7, batch 854
Training loss: 1.7383193969726562 

Epoch 7, batch 855
Training loss: 1.84932541847229 

Epoch 7, batch 85

Epoch 7, batch 1037
Training loss: 1.830378532409668 

Epoch 7, batch 1038
Training loss: 1.616856336593628 

Epoch 7, batch 1039
Training loss: 1.766125202178955 

Epoch 7, batch 1040
Training loss: 1.509111762046814 

Epoch 7, batch 1041
Training loss: 1.6064305305480957 

Epoch 7, batch 1042
Training loss: 1.9259577989578247 

Epoch 7, batch 1043
Training loss: 1.5753473043441772 

Epoch 7, batch 1044
Training loss: 1.595998764038086 

Epoch 7, batch 1045
Training loss: 1.9313178062438965 

Epoch 7, batch 1046
Training loss: 1.814204454421997 

Epoch 7, batch 1047
Training loss: 1.6642745733261108 

Epoch 7, batch 1048
Training loss: 1.7942534685134888 

Epoch 7, batch 1049
Training loss: 1.8435410261154175 

Epoch 7, batch 1050
Training loss: 1.684257984161377 

Epoch 7, batch 1051
Training loss: 1.8538293838500977 

Epoch 7, batch 1052
Training loss: 1.7739968299865723 

Epoch 7, batch 1053
Training loss: 1.7105859518051147 

Epoch 7, batch 1054
Training loss: 1.764033555984497 



Epoch 7, batch 1239
Training loss: 1.8439512252807617 

Epoch 7, batch 1240
Training loss: 1.9013502597808838 

Epoch 7, batch 1241
Training loss: 1.5577688217163086 

Epoch 7, batch 1242
Training loss: 1.7361148595809937 

Epoch 7, batch 1243
Training loss: 1.859061598777771 

Epoch 7, batch 1244
Training loss: 1.6654980182647705 

Epoch 7, batch 1245
Training loss: 1.913846731185913 

Epoch 7, batch 1246
Training loss: 1.7477145195007324 

Epoch 7, batch 1247
Training loss: 1.7351808547973633 

Epoch 7, batch 1248
Training loss: 1.9961777925491333 

Epoch 7, batch 1249
Training loss: 1.6816942691802979 

Epoch 7, batch 1250
Training loss: 1.688661813735962 

Epoch 7, batch 1251
Training loss: 1.5757962465286255 

Epoch 7, batch 1252
Training loss: 1.6708929538726807 

Epoch 7, batch 1253
Training loss: 1.9627492427825928 

Epoch 7, batch 1254
Training loss: 1.599686622619629 

Epoch 7, batch 1255
Training loss: 1.7527985572814941 

Epoch 7, batch 1256
Training loss: 1.685218095779419

Epoch 7, batch 1438
Training loss: 1.7677513360977173 

Epoch 7, batch 1439
Training loss: 1.6354522705078125 

Epoch 7, batch 1440
Training loss: 1.5397875308990479 

Epoch 7, batch 1441
Training loss: 1.5671000480651855 

Epoch 7, batch 1442
Training loss: 2.007965564727783 

Epoch 7, batch 1443
Training loss: 1.879235029220581 

Epoch 7, batch 1444
Training loss: 1.901129126548767 

Epoch 7, batch 1445
Training loss: 1.5580264329910278 

Epoch 7, batch 1446
Training loss: 1.557663917541504 

Epoch 7, batch 1447
Training loss: 1.6481060981750488 

Epoch 7, batch 1448
Training loss: 1.9076133966445923 

Epoch 7, batch 1449
Training loss: 1.861847996711731 

Epoch 7, batch 1450
Training loss: 1.8426496982574463 

Epoch 7, batch 1451
Training loss: 1.7746142148971558 

Epoch 7, batch 1452
Training loss: 1.7999303340911865 

Epoch 7, batch 1453
Training loss: 1.9475722312927246 

Epoch 7, batch 1454
Training loss: 1.8432223796844482 

Epoch 7, batch 1455
Training loss: 1.5330730676651 



Epoch 7, batch 1639
Training loss: 1.8407566547393799 

Epoch 7, batch 1640
Training loss: 1.8694448471069336 

Epoch 7, batch 1641
Training loss: 1.9068392515182495 

Epoch 7, batch 1642
Training loss: 1.630080223083496 

Epoch 7, batch 1643
Training loss: 1.5363333225250244 

Epoch 7, batch 1644
Training loss: 1.9009602069854736 

Epoch 7, batch 1645
Training loss: 1.657848834991455 

Epoch 7, batch 1646
Training loss: 1.5905647277832031 

Epoch 7, batch 1647
Training loss: 1.6056439876556396 

Epoch 7, batch 1648
Training loss: 1.6994106769561768 

Epoch 7, batch 1649
Training loss: 1.6287846565246582 

Epoch 7, batch 1650
Training loss: 1.6699788570404053 

Epoch 7, batch 1651
Training loss: 1.626996636390686 

Epoch 7, batch 1652
Training loss: 1.9258885383605957 

Epoch 7, batch 1653
Training loss: 1.8974016904830933 

Epoch 7, batch 1654
Training loss: 1.9622302055358887 

Epoch 7, batch 1655
Training loss: 1.538845419883728 

Epoch 7, batch 1656
Training loss: 1.755233764648437

Epoch 7, batch 1839
Training loss: 1.770338773727417 

Epoch 7, batch 1840
Training loss: 1.744303822517395 

Epoch 7, batch 1841
Training loss: 1.7228999137878418 

Epoch 7, batch 1842
Training loss: 1.6165926456451416 

Epoch 7, batch 1843
Training loss: 1.4732049703598022 

Epoch 7, batch 1844
Training loss: 1.8359565734863281 

Epoch 7, batch 1845
Training loss: 1.8310704231262207 

Epoch 7, batch 1846
Training loss: 1.6133911609649658 

Epoch 7, batch 1847
Training loss: 1.8564445972442627 

Epoch 7, batch 1848
Training loss: 1.7948963642120361 

Epoch 7, batch 1849
Training loss: 1.911348581314087 

Epoch 7, batch 1850
Training loss: 1.8143360614776611 

Epoch 7, batch 1851
Training loss: 1.719483733177185 

Epoch 7, batch 1852
Training loss: 1.648184061050415 

Epoch 7, batch 1853
Training loss: 1.8867816925048828 

Epoch 7, batch 1854
Training loss: 1.8742051124572754 

Epoch 7, batch 1855
Training loss: 1.7396783828735352 

Epoch 7, batch 1856
Training loss: 1.9133886098861694

Epoch 7, batch 2039
Training loss: 1.9598960876464844 

Epoch 7, batch 2040
Training loss: 1.9050565958023071 

Epoch 7, batch 2041
Training loss: 1.7191768884658813 

Epoch 7, batch 2042
Training loss: 1.7498111724853516 

Epoch 7, batch 2043
Training loss: 1.8410465717315674 

Epoch 7, batch 2044
Training loss: 1.635378122329712 

Epoch 7, batch 2045
Training loss: 1.4711993932724 

Epoch 7, batch 2046
Training loss: 1.7171704769134521 

Epoch 7, batch 2047
Training loss: 1.5528557300567627 

Epoch 7, batch 2048
Training loss: 1.8471729755401611 

Epoch 7, batch 2049
Training loss: 1.9104924201965332 

Epoch 7, batch 2050
Training loss: 1.9148961305618286 

Epoch 7, batch 2051
Training loss: 1.7264701128005981 

Epoch 7, batch 2052
Training loss: 1.944244146347046 

Epoch 7, batch 2053
Training loss: 1.8498836755752563 

Epoch 7, batch 2054
Training loss: 1.907517433166504 

Epoch 7, batch 2055
Training loss: 1.4849724769592285 

Epoch 7, batch 2056
Training loss: 1.7373387813568115 

Epoch 7, batch 2240
Training loss: 1.549641728401184 

Epoch 7, batch 2241
Training loss: 1.7540894746780396 

Epoch 7, batch 2242
Training loss: 1.951022744178772 

Epoch 7, batch 2243
Training loss: 1.6275769472122192 

Epoch 7, batch 2244
Training loss: 1.7331372499465942 

Epoch 7, batch 2245
Training loss: 1.9330896139144897 

Epoch 7, batch 2246
Training loss: 1.9303350448608398 

Epoch 7, batch 2247
Training loss: 1.8394217491149902 

Epoch 7, batch 2248
Training loss: 1.9933552742004395 

Epoch 7, batch 2249
Training loss: 1.6314496994018555 

Epoch 7, batch 2250
Training loss: 1.8445203304290771 

Epoch 7, batch 2251
Training loss: 1.7649376392364502 

Epoch 7, batch 2252
Training loss: 1.6749098300933838 

Epoch 7, batch 2253
Training loss: 1.887758731842041 

Epoch 7, batch 2254
Training loss: 1.8791539669036865 

Epoch 7, batch 2255
Training loss: 1.8269331455230713 

Epoch 7, batch 2256
Training loss: 1.636986255645752 

Epoch 7, batch 2257
Training loss: 1.694786190986633

Epoch 7, batch 2442
Training loss: 1.555208444595337 

Epoch 7, batch 2443
Training loss: 1.5167665481567383 

Epoch 7, batch 2444
Training loss: 1.6305127143859863 

Epoch 7, batch 2445
Training loss: 1.7077089548110962 

Epoch 7, batch 2446
Training loss: 1.8715505599975586 

Epoch 7, batch 2447
Training loss: 1.620917558670044 

Epoch 7, batch 2448
Training loss: 1.612234115600586 

Epoch 7, batch 2449
Training loss: 1.9156527519226074 

Epoch 7, batch 2450
Training loss: 1.7952107191085815 

Epoch 7, batch 2451
Training loss: 1.6394357681274414 

Epoch 7, batch 2452
Training loss: 1.725529432296753 

Epoch 7, batch 2453
Training loss: 1.8988420963287354 

Epoch 7, batch 2454
Training loss: 2.019465923309326 

Epoch 7, batch 2455
Training loss: 1.9170172214508057 

Epoch 7, batch 2456
Training loss: 1.6094666719436646 

Epoch 7, batch 2457
Training loss: 1.9320766925811768 

Epoch 7, batch 2458
Training loss: 1.8592567443847656 

Epoch 7, batch 2459
Training loss: 1.668703317642212 

Epoch 7, batch 2642
Training loss: 2.0008294582366943 

Epoch 7, batch 2643
Training loss: 1.8047012090682983 

Epoch 7, batch 2644
Training loss: 1.8320361375808716 

Epoch 7, batch 2645
Training loss: 1.7437151670455933 

Epoch 7, batch 2646
Training loss: 1.9644477367401123 

Epoch 7, batch 2647
Training loss: 1.6494890451431274 

Epoch 7, batch 2648
Training loss: 1.60075843334198 

Epoch 7, batch 2649
Training loss: 1.7531683444976807 

Epoch 7, batch 2650
Training loss: 1.9652683734893799 

Epoch 7, batch 2651
Training loss: 2.0091776847839355 

Epoch 7, batch 2652
Training loss: 1.9776794910430908 

Epoch 7, batch 2653
Training loss: 1.5540308952331543 

Epoch 7, batch 2654
Training loss: 1.6283717155456543 

Epoch 7, batch 2655
Training loss: 1.917831540107727 

Epoch 7, batch 2656
Training loss: 1.7002671957015991 

Epoch 7, batch 2657
Training loss: 1.9566020965576172 

Epoch 7, batch 2658
Training loss: 1.8336353302001953 

Epoch 7, batch 2659
Training loss: 1.68343329429626

Epoch 7, batch 2840
Training loss: 1.606124758720398 

Epoch 7, batch 2841
Training loss: 1.841689109802246 

Epoch 7, batch 2842
Training loss: 1.847074270248413 

Epoch 7, batch 2843
Training loss: 1.511695146560669 

Epoch 7, batch 2844
Training loss: 1.8557448387145996 

Epoch 7, batch 2845
Training loss: 1.6210272312164307 

Epoch 7, batch 2846
Training loss: 1.6141200065612793 

Epoch 7, batch 2847
Training loss: 1.8036012649536133 

Epoch 7, batch 2848
Training loss: 1.9002351760864258 

Epoch 7, batch 2849
Training loss: 1.8662245273590088 

Epoch 7, batch 2850
Training loss: 1.511171817779541 

Epoch 7, batch 2851
Training loss: 2.058225154876709 

Epoch 7, batch 2852
Training loss: 1.9671835899353027 

Epoch 7, batch 2853
Training loss: 1.7574689388275146 

Epoch 7, batch 2854
Training loss: 1.707249641418457 

Epoch 7, batch 2855
Training loss: 1.5025612115859985 

Epoch 7, batch 2856
Training loss: 1.6490567922592163 

Epoch 7, batch 2857
Training loss: 1.7859673500061035 


Epoch 7, batch 3039
Training loss: 1.4915251731872559 

Epoch 7, batch 3040
Training loss: 1.5538055896759033 

Epoch 7, batch 3041
Training loss: 1.6883270740509033 

Epoch 7, batch 3042
Training loss: 2.030308246612549 

Epoch 7, batch 3043
Training loss: 1.8244330883026123 

Epoch 7, batch 3044
Training loss: 1.601348876953125 

Epoch 7, batch 3045
Training loss: 1.7486019134521484 

Epoch 7, batch 3046
Training loss: 1.557188868522644 

Epoch 7, batch 3047
Training loss: 2.012167453765869 

Epoch 7, batch 3048
Training loss: 1.8589963912963867 

Epoch 7, batch 3049
Training loss: 1.7381141185760498 

Epoch 7, batch 3050
Training loss: 1.4900394678115845 

Epoch 7, batch 3051
Training loss: 1.804551362991333 

Epoch 7, batch 3052
Training loss: 1.755631923675537 

Epoch 7, batch 3053
Training loss: 1.8980270624160767 

Epoch 7, batch 3054
Training loss: 1.5695827007293701 

Epoch 7, batch 3055
Training loss: 1.7151566743850708 

Epoch 7, batch 3056
Training loss: 1.622412085533142 


Epoch 7, batch 3239
Training loss: 1.7896589040756226 

Epoch 7, batch 3240
Training loss: 1.559601902961731 

Epoch 7, batch 3241
Training loss: 1.8809462785720825 

Epoch 7, batch 3242
Training loss: 1.875829815864563 

Epoch 7, batch 3243
Training loss: 1.7993037700653076 

Epoch 7, batch 3244
Training loss: 1.7510769367218018 

Epoch 7, batch 3245
Training loss: 1.9979870319366455 

Epoch 7, batch 3246
Training loss: 1.7989802360534668 

Epoch 7, batch 3247
Training loss: 1.852036952972412 

Epoch 7, batch 3248
Training loss: 1.7558881044387817 

Epoch 7, batch 3249
Training loss: 1.582476258277893 

Epoch 7, batch 3250
Training loss: 1.9332354068756104 

Epoch 7, batch 3251
Training loss: 1.8304998874664307 

Epoch 7, batch 3252
Training loss: 1.9350183010101318 

Epoch 7, batch 3253
Training loss: 1.844787836074829 

Epoch 7, batch 3254
Training loss: 1.97896146774292 

Epoch 7, batch 3255
Training loss: 1.5263466835021973 

Epoch 7, batch 3256
Training loss: 1.4679657220840454 


Epoch 7, batch 3440
Training loss: 1.6846065521240234 

Epoch 7, batch 3441
Training loss: 1.7690309286117554 

Epoch 7, batch 3442
Training loss: 1.9444992542266846 

Epoch 7, batch 3443
Training loss: 1.8009839057922363 

Epoch 7, batch 3444
Training loss: 1.620654821395874 

Epoch 7, batch 3445
Training loss: 1.88062584400177 

Epoch 7, batch 3446
Training loss: 2.0150129795074463 

Epoch 7, batch 3447
Training loss: 1.7916923761367798 

Epoch 7, batch 3448
Training loss: 1.8669416904449463 

Epoch 7, batch 3449
Training loss: 1.9554977416992188 

Epoch 7, batch 3450
Training loss: 1.6712983846664429 

Epoch 7, batch 3451
Training loss: 1.569553256034851 

Epoch 7, batch 3452
Training loss: 1.6952725648880005 

Epoch 7, batch 3453
Training loss: 1.6558033227920532 

Epoch 7, batch 3454
Training loss: 1.7613434791564941 

Epoch 7, batch 3455
Training loss: 1.6192646026611328 

Epoch 7, batch 3456
Training loss: 1.9693199396133423 

Epoch 7, batch 3457
Training loss: 1.649209022521972

Epoch 7, batch 3640
Training loss: 1.5776840448379517 

Epoch 7, batch 3641
Training loss: 1.6746947765350342 

Epoch 7, batch 3642
Training loss: 1.609641432762146 

Epoch 7, batch 3643
Training loss: 1.649352788925171 

Epoch 7, batch 3644
Training loss: 1.7226516008377075 

Epoch 7, batch 3645
Training loss: 1.5574095249176025 

Epoch 7, batch 3646
Training loss: 1.8162970542907715 

Epoch 7, batch 3647
Training loss: 1.5568727254867554 

Epoch 7, batch 3648
Training loss: 1.897263526916504 

Epoch 7, batch 3649
Training loss: 1.6534106731414795 

Epoch 7, batch 3650
Training loss: 1.7536120414733887 

Epoch 7, batch 3651
Training loss: 1.8448588848114014 

Epoch 7, batch 3652
Training loss: 1.9544628858566284 

Epoch 7, batch 3653
Training loss: 1.745771884918213 

Epoch 7, batch 3654
Training loss: 1.7038596868515015 

Epoch 7, batch 3655
Training loss: 1.6912016868591309 

Epoch 7, batch 3656
Training loss: 1.9276564121246338 

Epoch 7, batch 3657
Training loss: 1.904989957809448

Epoch 7, batch 3838
Training loss: 1.552640438079834 

Epoch 7, batch 3839
Training loss: 1.8241466283798218 

Epoch 7, batch 3840
Training loss: 1.4926775693893433 

Epoch 7, batch 3841
Training loss: 1.5634682178497314 

Epoch 7, batch 3842
Training loss: 1.6575934886932373 

Epoch 7, batch 3843
Training loss: 1.7103323936462402 

Epoch 7, batch 3844
Training loss: 1.9310097694396973 

Epoch 7, batch 3845
Training loss: 1.9013359546661377 

Epoch 7, batch 3846
Training loss: 1.8690271377563477 

Epoch 7, batch 3847
Training loss: 1.9187803268432617 

Epoch 7, batch 3848
Training loss: 1.6571533679962158 

Epoch 7, batch 3849
Training loss: 1.7159104347229004 

Epoch 7, batch 3850
Training loss: 1.768530249595642 

Epoch 7, batch 3851
Training loss: 1.9846570491790771 

Epoch 7, batch 3852
Training loss: 1.7200298309326172 

Epoch 7, batch 3853
Training loss: 1.661268711090088 

Epoch 7, batch 3854
Training loss: 1.8085330724716187 

Epoch 7, batch 3855
Training loss: 1.82734763622283

Epoch 7, batch 4039
Training loss: 1.778391718864441 

Epoch 7, batch 4040
Training loss: 1.8553369045257568 

Epoch 7, batch 4041
Training loss: 1.5888426303863525 

Epoch 7, batch 4042
Training loss: 1.5771371126174927 

Epoch 7, batch 4043
Training loss: 1.7462283372879028 

Epoch 7, batch 4044
Training loss: 1.5872918367385864 

Epoch 7, batch 4045
Training loss: 1.8470110893249512 

Epoch 7, batch 4046
Training loss: 1.6971395015716553 

Epoch 7, batch 4047
Training loss: 1.6817022562026978 

Epoch 7, batch 4048
Training loss: 2.0095109939575195 

Epoch 7, batch 4049
Training loss: 1.8171675205230713 

Epoch 7, batch 4050
Training loss: 1.8497682809829712 

Epoch 7, batch 4051
Training loss: 1.6603487730026245 

Epoch 7, batch 4052
Training loss: 1.7428447008132935 

Epoch 7, batch 4053
Training loss: 1.8222227096557617 

Epoch 7, batch 4054
Training loss: 1.8089029788970947 

Epoch 7, batch 4055
Training loss: 1.855299472808838 

Epoch 7, batch 4056
Training loss: 1.6366478204727

Epoch 7, batch 4242
Training loss: 1.469126582145691 

Epoch 7, batch 4243
Training loss: 1.5868369340896606 

Epoch 7, batch 4244
Training loss: 1.524567723274231 

Epoch 7, batch 4245
Training loss: 1.9000047445297241 

Epoch 7, batch 4246
Training loss: 2.048384666442871 

Epoch 7, batch 4247
Training loss: 1.6017893552780151 

Epoch 7, batch 4248
Training loss: 1.5850592851638794 

Epoch 7, batch 4249
Training loss: 1.7681382894515991 

Epoch 7, batch 4250
Training loss: 1.9170136451721191 

Epoch 7, batch 4251
Training loss: 1.8773841857910156 

Epoch 7, batch 4252
Training loss: 1.5317095518112183 

Epoch 7, batch 4253
Training loss: 1.874941349029541 

Epoch 7, batch 4254
Training loss: 1.7569580078125 

Epoch 7, batch 4255
Training loss: 1.8553135395050049 

Epoch 7, batch 4256
Training loss: 1.8525199890136719 

Epoch 7, batch 4257
Training loss: 1.5800094604492188 

Epoch 7, batch 4258
Training loss: 1.5313806533813477 

Epoch 7, batch 4259
Training loss: 1.7694766521453857 


Epoch 7, batch 4444
Training loss: 1.560542106628418 

Epoch 7, batch 4445
Training loss: 1.763070821762085 

Epoch 7, batch 4446
Training loss: 1.78139066696167 

Epoch 7, batch 4447
Training loss: 1.535958170890808 

Epoch 7, batch 4448
Training loss: 1.6059476137161255 

Epoch 7, batch 4449
Training loss: 1.8135603666305542 

Epoch 7, batch 4450
Training loss: 1.8962733745574951 

Epoch 7, batch 4451
Training loss: 1.905334711074829 

Epoch 7, batch 4452
Training loss: 1.6958773136138916 

Epoch 7, batch 4453
Training loss: 1.6610348224639893 

Epoch 7, batch 4454
Training loss: 1.6578867435455322 

Epoch 7, batch 4455
Training loss: 1.7575434446334839 

Epoch 7, batch 4456
Training loss: 1.7747786045074463 

Epoch 7, batch 4457
Training loss: 1.7758907079696655 

Epoch 7, batch 4458
Training loss: 2.044177532196045 

Epoch 7, batch 4459
Training loss: 1.7378382682800293 

Epoch 7, batch 4460
Training loss: 1.6734206676483154 

Epoch 7, batch 4461
Training loss: 1.899566411972046 



Epoch 7, batch 4646
Training loss: 1.6898999214172363 

Epoch 7, batch 4647
Training loss: 1.6549654006958008 

Epoch 7, batch 4648
Training loss: 1.9462223052978516 

Epoch 7, batch 4649
Training loss: 1.5882936716079712 

Epoch 7, batch 4650
Training loss: 1.8270063400268555 

Epoch 7, batch 4651
Training loss: 1.7233412265777588 

Epoch 7, batch 4652
Training loss: 1.7880291938781738 

Epoch 7, batch 4653
Training loss: 1.7792317867279053 

Epoch 7, batch 4654
Training loss: 1.5827245712280273 

Epoch 7, batch 4655
Training loss: 1.6397470235824585 

Epoch 7, batch 4656
Training loss: 1.5163843631744385 

Epoch 7, batch 4657
Training loss: 1.8096287250518799 

Epoch 7, batch 4658
Training loss: 1.708989143371582 

Epoch 7, batch 4659
Training loss: 1.961421251296997 

Epoch 7, batch 4660
Training loss: 1.7524700164794922 

Epoch 7, batch 4661
Training loss: 1.926612377166748 

Epoch 7, batch 4662
Training loss: 1.9626837968826294 

Epoch 7, batch 4663
Training loss: 2.12760972976684

Epoch 7, batch 4848
Training loss: 1.5277220010757446 

Epoch 7, batch 4849
Training loss: 1.532538652420044 

Epoch 7, batch 4850
Training loss: 1.740699052810669 

Epoch 7, batch 4851
Training loss: 1.9153239727020264 

Epoch 7, batch 4852
Training loss: 1.7091693878173828 

Epoch 7, batch 4853
Training loss: 1.9435293674468994 

Epoch 7, batch 4854
Training loss: 1.6791596412658691 

Epoch 7, batch 4855
Training loss: 1.805847406387329 

Epoch 7, batch 4856
Training loss: 1.77837336063385 

Epoch 7, batch 4857
Training loss: 1.788316249847412 

Epoch 7, batch 4858
Training loss: 1.6484551429748535 

Epoch 7, batch 4859
Training loss: 1.5873448848724365 

Epoch 7, batch 4860
Training loss: 1.898026466369629 

Epoch 7, batch 4861
Training loss: 1.9165656566619873 

Epoch 7, batch 4862
Training loss: 1.8684191703796387 

Epoch 7, batch 4863
Training loss: 1.8136711120605469 

Epoch 7, batch 4864
Training loss: 1.787235975265503 

Epoch 7, batch 4865
Training loss: 1.5265235900878906 



Epoch 7, batch 5049
Training loss: 1.66485595703125 

Epoch 7, batch 5050
Training loss: 1.6529560089111328 

Epoch 7, batch 5051
Training loss: 1.857169508934021 

Epoch 7, batch 5052
Training loss: 1.7433879375457764 

Epoch 7, batch 5053
Training loss: 1.866921067237854 

Epoch 7, batch 5054
Training loss: 1.9165340662002563 

Epoch 7, batch 5055
Training loss: 1.4985623359680176 

Epoch 7, batch 5056
Training loss: 1.4643492698669434 

Epoch 7, batch 5057
Training loss: 1.780583381652832 

Epoch 7, batch 5058
Training loss: 1.773232102394104 

Epoch 7, batch 5059
Training loss: 1.7210686206817627 

Epoch 7, batch 5060
Training loss: 1.792115330696106 

Epoch 7, batch 5061
Training loss: 1.694196105003357 

Epoch 7, batch 5062
Training loss: 1.7604660987854004 

Epoch 7, batch 5063
Training loss: 1.6637998819351196 

Epoch 7, batch 5064
Training loss: 1.7163705825805664 

Epoch 7, batch 5065
Training loss: 1.5915101766586304 

Epoch 7, batch 5066
Training loss: 1.9551289081573486 



Epoch 7, batch 5253
Training loss: 1.7725106477737427 

Epoch 7, batch 5254
Training loss: 1.8045706748962402 

Epoch 7, batch 5255
Training loss: 1.900071620941162 

Epoch 7, batch 5256
Training loss: 1.8447117805480957 

Epoch 7, batch 5257
Training loss: 1.664745569229126 

Epoch 7, batch 5258
Training loss: 1.9100298881530762 

Epoch 7, batch 5259
Training loss: 1.7492430210113525 

Epoch 7, batch 5260
Training loss: 1.5941283702850342 

Epoch 7, batch 5261
Training loss: 1.9545519351959229 

Epoch 7, batch 5262
Training loss: 1.9317567348480225 

Epoch 7, batch 5263
Training loss: 1.5967776775360107 

Epoch 7, batch 5264
Training loss: 1.7406212091445923 

Epoch 7, batch 5265
Training loss: 1.770871877670288 

Epoch 7, batch 5266
Training loss: 1.6269813776016235 

Epoch 7, batch 5267
Training loss: 1.6439313888549805 

Epoch 7, batch 5268
Training loss: 1.6928925514221191 

Epoch 7, batch 5269
Training loss: 1.7208162546157837 

Epoch 7, batch 5270
Training loss: 1.91225659847259

Epoch 7, batch 5456
Training loss: 2.139941930770874 

Epoch 7, batch 5457
Training loss: 1.769880771636963 

Epoch 7, batch 5458
Training loss: 1.9520654678344727 

Epoch 7, batch 5459
Training loss: 1.9061613082885742 

Epoch 7, batch 5460
Training loss: 1.8573269844055176 

Epoch 7, batch 5461
Training loss: 1.8111340999603271 

Epoch 7, batch 5462
Training loss: 1.9641224145889282 

Epoch 7, batch 5463
Training loss: 1.6609601974487305 

Epoch 7, batch 5464
Training loss: 1.8751773834228516 

Epoch 7, batch 5465
Training loss: 1.879429578781128 

Epoch 7, batch 5466
Training loss: 1.615805745124817 

Epoch 7, batch 5467
Training loss: 1.740401268005371 

Epoch 7, batch 5468
Training loss: 1.8645306825637817 

Epoch 7, batch 5469
Training loss: 1.6586836576461792 

Epoch 7, batch 5470
Training loss: 1.8208365440368652 

Epoch 7, batch 5471
Training loss: 1.4901553392410278 

Epoch 7, batch 5472
Training loss: 1.6734819412231445 

Epoch 7, batch 5473
Training loss: 1.9115509986877441

Epoch 7, batch 5659
Training loss: 1.5252610445022583 

Epoch 7, batch 5660
Training loss: 1.6126335859298706 

Epoch 7, batch 5661
Training loss: 1.9446032047271729 

Epoch 7, batch 5662
Training loss: 1.6606253385543823 

Epoch 7, batch 5663
Training loss: 1.657649040222168 

Epoch 7, batch 5664
Training loss: 1.8503071069717407 

Epoch 7, batch 5665
Training loss: 1.904916524887085 

Epoch 7, batch 5666
Training loss: 1.869980812072754 

Epoch 7, batch 5667
Training loss: 1.7177592515945435 

Epoch 7, batch 5668
Training loss: 1.7966728210449219 

Epoch 7, batch 5669
Training loss: 1.7403486967086792 

Epoch 7, batch 5670
Training loss: 1.5791281461715698 

Epoch 7, batch 5671
Training loss: 1.5820084810256958 

Epoch 7, batch 5672
Training loss: 1.8618193864822388 

Epoch 7, batch 5673
Training loss: 1.6978600025177002 

Epoch 7, batch 5674
Training loss: 1.8699524402618408 

Epoch 7, batch 5675
Training loss: 1.7108148336410522 

Epoch 7, batch 5676
Training loss: 1.55120909214019

Epoch 7, batch 5855
Training loss: 1.6580475568771362 

Epoch 7, batch 5856
Training loss: 1.5559619665145874 

Epoch 7, batch 5857
Training loss: 1.790969729423523 

Epoch 7, batch 5858
Training loss: 1.6094756126403809 

Epoch 7, batch 5859
Training loss: 1.624068260192871 

Epoch 7, batch 5860
Training loss: 1.6718075275421143 

Epoch 7, batch 5861
Training loss: 1.8710371255874634 

Epoch 7, batch 5862
Training loss: 1.7655240297317505 

Epoch 7, batch 5863
Training loss: 1.94978666305542 

Epoch 7, batch 5864
Training loss: 1.4958077669143677 

Epoch 7, batch 5865
Training loss: 1.6595194339752197 

Epoch 7, batch 5866
Training loss: 2.1204440593719482 

Epoch 7, batch 5867
Training loss: 1.7013205289840698 

Epoch 7, batch 5868
Training loss: 1.8033092021942139 

Epoch 7, batch 5869
Training loss: 1.81424880027771 

Epoch 7, batch 5870
Training loss: 2.040468692779541 

Epoch 7, batch 5871
Training loss: 1.7248215675354004 

Epoch 7, batch 5872
Training loss: 1.8495454788208008 


Epoch 8, batch 58
Training loss: 1.70189368724823 

Epoch 8, batch 59
Training loss: 1.8257508277893066 

Epoch 8, batch 60
Training loss: 1.4838976860046387 

Epoch 8, batch 61
Training loss: 1.5734241008758545 

Epoch 8, batch 62
Training loss: 1.7751811742782593 

Epoch 8, batch 63
Training loss: 1.5158236026763916 

Epoch 8, batch 64
Training loss: 1.8396656513214111 

Epoch 8, batch 65
Training loss: 1.5034642219543457 

Epoch 8, batch 66
Training loss: 1.762134313583374 

Epoch 8, batch 67
Training loss: 1.9623833894729614 

Epoch 8, batch 68
Training loss: 1.7667784690856934 

Epoch 8, batch 69
Training loss: 1.8142331838607788 

Epoch 8, batch 70
Training loss: 1.6927227973937988 

Epoch 8, batch 71
Training loss: 1.583525538444519 

Epoch 8, batch 72
Training loss: 1.5952844619750977 

Epoch 8, batch 73
Training loss: 1.765822172164917 

Epoch 8, batch 74
Training loss: 1.8624639511108398 

Epoch 8, batch 75
Training loss: 1.6745421886444092 

Epoch 8, batch 76
Training loss: 

Epoch 8, batch 262
Training loss: 1.8760616779327393 

Epoch 8, batch 263
Training loss: 1.5145840644836426 

Epoch 8, batch 264
Training loss: 1.5289667844772339 

Epoch 8, batch 265
Training loss: 1.8628790378570557 

Epoch 8, batch 266
Training loss: 1.6853597164154053 

Epoch 8, batch 267
Training loss: 1.6103930473327637 

Epoch 8, batch 268
Training loss: 1.5983980894088745 

Epoch 8, batch 269
Training loss: 1.8616313934326172 

Epoch 8, batch 270
Training loss: 1.7226274013519287 

Epoch 8, batch 271
Training loss: 1.5560879707336426 

Epoch 8, batch 272
Training loss: 1.7148951292037964 

Epoch 8, batch 273
Training loss: 1.5085581541061401 

Epoch 8, batch 274
Training loss: 1.855501651763916 

Epoch 8, batch 275
Training loss: 1.815826177597046 

Epoch 8, batch 276
Training loss: 1.5151493549346924 

Epoch 8, batch 277
Training loss: 1.5362999439239502 

Epoch 8, batch 278
Training loss: 1.9205021858215332 

Epoch 8, batch 279
Training loss: 2.057924270629883 

Epoch 8, batc

Epoch 8, batch 464
Training loss: 1.862349510192871 

Epoch 8, batch 465
Training loss: 1.6576900482177734 

Epoch 8, batch 466
Training loss: 1.5069915056228638 

Epoch 8, batch 467
Training loss: 1.6296271085739136 

Epoch 8, batch 468
Training loss: 1.660382866859436 

Epoch 8, batch 469
Training loss: 1.8693647384643555 

Epoch 8, batch 470
Training loss: 1.637068510055542 

Epoch 8, batch 471
Training loss: 1.7571451663970947 

Epoch 8, batch 472
Training loss: 1.7268424034118652 

Epoch 8, batch 473
Training loss: 1.6243516206741333 

Epoch 8, batch 474
Training loss: 1.5941319465637207 

Epoch 8, batch 475
Training loss: 1.8452105522155762 

Epoch 8, batch 476
Training loss: 1.8117338418960571 

Epoch 8, batch 477
Training loss: 1.8713876008987427 

Epoch 8, batch 478
Training loss: 1.6796880960464478 

Epoch 8, batch 479
Training loss: 1.6701505184173584 

Epoch 8, batch 480
Training loss: 1.9519684314727783 

Epoch 8, batch 481
Training loss: 1.8525006771087646 

Epoch 8, batc

Epoch 8, batch 667
Training loss: 1.7610971927642822 

Epoch 8, batch 668
Training loss: 1.5683280229568481 

Epoch 8, batch 669
Training loss: 1.948483943939209 

Epoch 8, batch 670
Training loss: 1.9624345302581787 

Epoch 8, batch 671
Training loss: 1.546491026878357 

Epoch 8, batch 672
Training loss: 1.5774630308151245 

Epoch 8, batch 673
Training loss: 1.6856255531311035 

Epoch 8, batch 674
Training loss: 1.6369338035583496 

Epoch 8, batch 675
Training loss: 1.5663244724273682 

Epoch 8, batch 676
Training loss: 1.9457993507385254 

Epoch 8, batch 677
Training loss: 1.837699055671692 

Epoch 8, batch 678
Training loss: 1.5667343139648438 

Epoch 8, batch 679
Training loss: 1.8166775703430176 

Epoch 8, batch 680
Training loss: 1.7708206176757812 

Epoch 8, batch 681
Training loss: 1.5608843564987183 

Epoch 8, batch 682
Training loss: 2.030745267868042 

Epoch 8, batch 683
Training loss: 1.9615669250488281 

Epoch 8, batch 684
Training loss: 1.860147476196289 

Epoch 8, batch 

Epoch 8, batch 871
Training loss: 1.5695098638534546 

Epoch 8, batch 872
Training loss: 1.6143642663955688 

Epoch 8, batch 873
Training loss: 1.7243223190307617 

Epoch 8, batch 874
Training loss: 1.5648465156555176 

Epoch 8, batch 875
Training loss: 1.8284101486206055 

Epoch 8, batch 876
Training loss: 1.9644393920898438 

Epoch 8, batch 877
Training loss: 1.8387813568115234 

Epoch 8, batch 878
Training loss: 1.9798665046691895 

Epoch 8, batch 879
Training loss: 1.7218871116638184 

Epoch 8, batch 880
Training loss: 1.680532455444336 

Epoch 8, batch 881
Training loss: 1.865915060043335 

Epoch 8, batch 882
Training loss: 1.9696422815322876 

Epoch 8, batch 883
Training loss: 1.8989734649658203 

Epoch 8, batch 884
Training loss: 1.7307710647583008 

Epoch 8, batch 885
Training loss: 1.9925265312194824 

Epoch 8, batch 886
Training loss: 1.601222038269043 

Epoch 8, batch 887
Training loss: 1.7087373733520508 

Epoch 8, batch 888
Training loss: 1.737962007522583 

Epoch 8, batch

Epoch 8, batch 1073
Training loss: 1.8871235847473145 

Epoch 8, batch 1074
Training loss: 1.757325530052185 

Epoch 8, batch 1075
Training loss: 1.7875806093215942 

Epoch 8, batch 1076
Training loss: 1.7340826988220215 

Epoch 8, batch 1077
Training loss: 1.5698001384735107 

Epoch 8, batch 1078
Training loss: 1.7412745952606201 

Epoch 8, batch 1079
Training loss: 1.9629827737808228 

Epoch 8, batch 1080
Training loss: 1.684604287147522 

Epoch 8, batch 1081
Training loss: 1.8310978412628174 

Epoch 8, batch 1082
Training loss: 1.4815258979797363 

Epoch 8, batch 1083
Training loss: 1.5531222820281982 

Epoch 8, batch 1084
Training loss: 1.7938019037246704 

Epoch 8, batch 1085
Training loss: 1.8469371795654297 

Epoch 8, batch 1086
Training loss: 1.9022786617279053 

Epoch 8, batch 1087
Training loss: 1.5176624059677124 

Epoch 8, batch 1088
Training loss: 1.859187126159668 

Epoch 8, batch 1089
Training loss: 1.9259700775146484 

Epoch 8, batch 1090
Training loss: 1.73983216285705

Epoch 8, batch 1277
Training loss: 1.6894006729125977 

Epoch 8, batch 1278
Training loss: 1.6714223623275757 

Epoch 8, batch 1279
Training loss: 1.9848904609680176 

Epoch 8, batch 1280
Training loss: 2.0077552795410156 

Epoch 8, batch 1281
Training loss: 1.8584747314453125 

Epoch 8, batch 1282
Training loss: 1.6368290185928345 

Epoch 8, batch 1283
Training loss: 1.4694749116897583 

Epoch 8, batch 1284
Training loss: 1.604254961013794 

Epoch 8, batch 1285
Training loss: 1.671466588973999 

Epoch 8, batch 1286
Training loss: 1.4826985597610474 

Epoch 8, batch 1287
Training loss: 1.8745001554489136 

Epoch 8, batch 1288
Training loss: 1.9337310791015625 

Epoch 8, batch 1289
Training loss: 1.9969336986541748 

Epoch 8, batch 1290
Training loss: 1.706103801727295 

Epoch 8, batch 1291
Training loss: 1.8191578388214111 

Epoch 8, batch 1292
Training loss: 1.5338222980499268 

Epoch 8, batch 1293
Training loss: 1.5558571815490723 

Epoch 8, batch 1294
Training loss: 1.81652331352233

Epoch 8, batch 1481
Training loss: 1.8907139301300049 

Epoch 8, batch 1482
Training loss: 1.7050917148590088 

Epoch 8, batch 1483
Training loss: 2.011063575744629 

Epoch 8, batch 1484
Training loss: 1.672454595565796 

Epoch 8, batch 1485
Training loss: 1.8593833446502686 

Epoch 8, batch 1486
Training loss: 2.027921676635742 

Epoch 8, batch 1487
Training loss: 1.648601770401001 

Epoch 8, batch 1488
Training loss: 1.8411363363265991 

Epoch 8, batch 1489
Training loss: 1.7766565084457397 

Epoch 8, batch 1490
Training loss: 1.9331248998641968 

Epoch 8, batch 1491
Training loss: 1.574578046798706 

Epoch 8, batch 1492
Training loss: 1.9322688579559326 

Epoch 8, batch 1493
Training loss: 1.5431764125823975 

Epoch 8, batch 1494
Training loss: 1.8220856189727783 

Epoch 8, batch 1495
Training loss: 1.9759793281555176 

Epoch 8, batch 1496
Training loss: 1.6963523626327515 

Epoch 8, batch 1497
Training loss: 1.933975100517273 

Epoch 8, batch 1498
Training loss: 1.9173450469970703 

Epoch 8, batch 1685
Training loss: 1.5884804725646973 

Epoch 8, batch 1686
Training loss: 1.908301830291748 

Epoch 8, batch 1687
Training loss: 1.9226086139678955 

Epoch 8, batch 1688
Training loss: 1.6566822528839111 

Epoch 8, batch 1689
Training loss: 1.8808255195617676 

Epoch 8, batch 1690
Training loss: 1.6887471675872803 

Epoch 8, batch 1691
Training loss: 1.6210448741912842 

Epoch 8, batch 1692
Training loss: 1.632429838180542 

Epoch 8, batch 1693
Training loss: 1.8553783893585205 

Epoch 8, batch 1694
Training loss: 1.6746153831481934 

Epoch 8, batch 1695
Training loss: 1.8561780452728271 

Epoch 8, batch 1696
Training loss: 2.0220842361450195 

Epoch 8, batch 1697
Training loss: 1.7807210683822632 

Epoch 8, batch 1698
Training loss: 1.8075380325317383 

Epoch 8, batch 1699
Training loss: 1.8096022605895996 

Epoch 8, batch 1700
Training loss: 1.7867398262023926 

Epoch 8, batch 1701
Training loss: 1.8553980588912964 

Epoch 8, batch 1702
Training loss: 1.4739351272583

Epoch 8, batch 1889
Training loss: 1.7277549505233765 

Epoch 8, batch 1890
Training loss: 1.4968268871307373 

Epoch 8, batch 1891
Training loss: 1.9647619724273682 

Epoch 8, batch 1892
Training loss: 1.649442195892334 

Epoch 8, batch 1893
Training loss: 1.7064846754074097 

Epoch 8, batch 1894
Training loss: 1.7472922801971436 

Epoch 8, batch 1895
Training loss: 1.6672285795211792 

Epoch 8, batch 1896
Training loss: 1.5923835039138794 

Epoch 8, batch 1897
Training loss: 1.6545146703720093 

Epoch 8, batch 1898
Training loss: 1.842785120010376 

Epoch 8, batch 1899
Training loss: 1.632025957107544 

Epoch 8, batch 1900
Training loss: 1.5068182945251465 

Epoch 8, batch 1901
Training loss: 1.6707110404968262 

Epoch 8, batch 1902
Training loss: 1.6163301467895508 

Epoch 8, batch 1903
Training loss: 1.8453847169876099 

Epoch 8, batch 1904
Training loss: 1.706000566482544 

Epoch 8, batch 1905
Training loss: 1.6786243915557861 

Epoch 8, batch 1906
Training loss: 1.477550625801086

Epoch 8, batch 2093
Training loss: 1.9033112525939941 

Epoch 8, batch 2094
Training loss: 1.8022325038909912 

Epoch 8, batch 2095
Training loss: 1.8809778690338135 

Epoch 8, batch 2096
Training loss: 1.624466061592102 

Epoch 8, batch 2097
Training loss: 1.7231123447418213 

Epoch 8, batch 2098
Training loss: 1.6437968015670776 

Epoch 8, batch 2099
Training loss: 1.637323260307312 

Epoch 8, batch 2100
Training loss: 1.9470428228378296 

Epoch 8, batch 2101
Training loss: 1.8326958417892456 

Epoch 8, batch 2102
Training loss: 1.822955846786499 

Epoch 8, batch 2103
Training loss: 1.8787962198257446 

Epoch 8, batch 2104
Training loss: 1.5013705492019653 

Epoch 8, batch 2105
Training loss: 1.5066945552825928 

Epoch 8, batch 2106
Training loss: 1.6010397672653198 

Epoch 8, batch 2107
Training loss: 1.9831013679504395 

Epoch 8, batch 2108
Training loss: 1.673680305480957 

Epoch 8, batch 2109
Training loss: 1.700140118598938 

Epoch 8, batch 2110
Training loss: 1.8051540851593018

Epoch 8, batch 2297
Training loss: 1.7654929161071777 

Epoch 8, batch 2298
Training loss: 1.7470399141311646 

Epoch 8, batch 2299
Training loss: 1.8072543144226074 

Epoch 8, batch 2300
Training loss: 1.8986892700195312 

Epoch 8, batch 2301
Training loss: 1.762403964996338 

Epoch 8, batch 2302
Training loss: 1.9418258666992188 

Epoch 8, batch 2303
Training loss: 1.7780659198760986 

Epoch 8, batch 2304
Training loss: 1.880003571510315 

Epoch 8, batch 2305
Training loss: 1.750433087348938 

Epoch 8, batch 2306
Training loss: 1.7272827625274658 

Epoch 8, batch 2307
Training loss: 1.8932695388793945 

Epoch 8, batch 2308
Training loss: 1.8889738321304321 

Epoch 8, batch 2309
Training loss: 1.6787772178649902 

Epoch 8, batch 2310
Training loss: 1.8983323574066162 

Epoch 8, batch 2311
Training loss: 1.7319598197937012 

Epoch 8, batch 2312
Training loss: 1.7712323665618896 

Epoch 8, batch 2313
Training loss: 1.851173758506775 

Epoch 8, batch 2314
Training loss: 1.501787066459655

Epoch 8, batch 2502
Training loss: 1.6370069980621338 

Epoch 8, batch 2503
Training loss: 1.7902613878250122 

Epoch 8, batch 2504
Training loss: 1.8161427974700928 

Epoch 8, batch 2505
Training loss: 1.8593499660491943 

Epoch 8, batch 2506
Training loss: 1.5093644857406616 

Epoch 8, batch 2507
Training loss: 1.6045987606048584 

Epoch 8, batch 2508
Training loss: 1.7320462465286255 

Epoch 8, batch 2509
Training loss: 1.7838575839996338 

Epoch 8, batch 2510
Training loss: 1.757093071937561 

Epoch 8, batch 2511
Training loss: 1.556602954864502 

Epoch 8, batch 2512
Training loss: 1.5996003150939941 

Epoch 8, batch 2513
Training loss: 1.9178621768951416 

Epoch 8, batch 2514
Training loss: 1.613008975982666 

Epoch 8, batch 2515
Training loss: 1.6800460815429688 

Epoch 8, batch 2516
Training loss: 1.7639036178588867 

Epoch 8, batch 2517
Training loss: 1.953133463859558 

Epoch 8, batch 2518
Training loss: 1.7336894273757935 

Epoch 8, batch 2519
Training loss: 1.860209703445434

Epoch 8, batch 2705
Training loss: 1.5360150337219238 

Epoch 8, batch 2706
Training loss: 1.731855034828186 

Epoch 8, batch 2707
Training loss: 1.808307409286499 

Epoch 8, batch 2708
Training loss: 1.670228123664856 

Epoch 8, batch 2709
Training loss: 1.481382131576538 

Epoch 8, batch 2710
Training loss: 1.8256691694259644 

Epoch 8, batch 2711
Training loss: 1.5345667600631714 

Epoch 8, batch 2712
Training loss: 1.710729718208313 

Epoch 8, batch 2713
Training loss: 1.7682714462280273 

Epoch 8, batch 2714
Training loss: 1.8774491548538208 

Epoch 8, batch 2715
Training loss: 2.033353805541992 

Epoch 8, batch 2716
Training loss: 1.8788948059082031 

Epoch 8, batch 2717
Training loss: 1.5386803150177002 

Epoch 8, batch 2718
Training loss: 1.6734881401062012 

Epoch 8, batch 2719
Training loss: 1.9474022388458252 

Epoch 8, batch 2720
Training loss: 1.6980957984924316 

Epoch 8, batch 2721
Training loss: 1.7136037349700928 

Epoch 8, batch 2722
Training loss: 1.679426670074463 


Epoch 8, batch 2908
Training loss: 1.8829506635665894 

Epoch 8, batch 2909
Training loss: 1.9022225141525269 

Epoch 8, batch 2910
Training loss: 1.5902304649353027 

Epoch 8, batch 2911
Training loss: 1.7151589393615723 

Epoch 8, batch 2912
Training loss: 1.529798984527588 

Epoch 8, batch 2913
Training loss: 1.708737850189209 

Epoch 8, batch 2914
Training loss: 1.908111333847046 

Epoch 8, batch 2915
Training loss: 1.7361453771591187 

Epoch 8, batch 2916
Training loss: 1.7970855236053467 

Epoch 8, batch 2917
Training loss: 1.8519160747528076 

Epoch 8, batch 2918
Training loss: 1.6076487302780151 

Epoch 8, batch 2919
Training loss: 2.005582094192505 

Epoch 8, batch 2920
Training loss: 1.9406980276107788 

Epoch 8, batch 2921
Training loss: 1.6544667482376099 

Epoch 8, batch 2922
Training loss: 1.7041916847229004 

Epoch 8, batch 2923
Training loss: 1.8484079837799072 

Epoch 8, batch 2924
Training loss: 1.9854772090911865 

Epoch 8, batch 2925
Training loss: 2.045374631881714

Epoch 8, batch 3110
Training loss: 1.760460615158081 

Epoch 8, batch 3111
Training loss: 1.7244131565093994 

Epoch 8, batch 3112
Training loss: 1.8336727619171143 

Epoch 8, batch 3113
Training loss: 1.6394071578979492 

Epoch 8, batch 3114
Training loss: 1.5239571332931519 

Epoch 8, batch 3115
Training loss: 1.9500041007995605 

Epoch 8, batch 3116
Training loss: 1.7545418739318848 

Epoch 8, batch 3117
Training loss: 1.8954973220825195 

Epoch 8, batch 3118
Training loss: 1.7214274406433105 

Epoch 8, batch 3119
Training loss: 1.621626853942871 

Epoch 8, batch 3120
Training loss: 1.809248447418213 

Epoch 8, batch 3121
Training loss: 1.9058518409729004 

Epoch 8, batch 3122
Training loss: 1.625192642211914 

Epoch 8, batch 3123
Training loss: 1.9660308361053467 

Epoch 8, batch 3124
Training loss: 1.4803355932235718 

Epoch 8, batch 3125
Training loss: 1.4707918167114258 

Epoch 8, batch 3126
Training loss: 1.9034740924835205 

Epoch 8, batch 3127
Training loss: 1.724713563919067

Epoch 8, batch 3313
Training loss: 1.74344801902771 

Epoch 8, batch 3314
Training loss: 1.5021653175354004 

Epoch 8, batch 3315
Training loss: 1.864229679107666 

Epoch 8, batch 3316
Training loss: 1.915910243988037 

Epoch 8, batch 3317
Training loss: 1.7797445058822632 

Epoch 8, batch 3318
Training loss: 1.8469122648239136 

Epoch 8, batch 3319
Training loss: 1.9048097133636475 

Epoch 8, batch 3320
Training loss: 1.579049825668335 

Epoch 8, batch 3321
Training loss: 1.8279614448547363 

Epoch 8, batch 3322
Training loss: 1.8238605260849 

Epoch 8, batch 3323
Training loss: 1.7939698696136475 

Epoch 8, batch 3324
Training loss: 1.6105595827102661 

Epoch 8, batch 3325
Training loss: 1.5939608812332153 

Epoch 8, batch 3326
Training loss: 1.5747694969177246 

Epoch 8, batch 3327
Training loss: 1.9470078945159912 

Epoch 8, batch 3328
Training loss: 1.7356700897216797 

Epoch 8, batch 3329
Training loss: 1.707491397857666 

Epoch 8, batch 3330
Training loss: 1.7963156700134277 

E

Epoch 8, batch 3517
Training loss: 2.0083229541778564 

Epoch 8, batch 3518
Training loss: 1.8894689083099365 

Epoch 8, batch 3519
Training loss: 1.6065783500671387 

Epoch 8, batch 3520
Training loss: 1.6664584875106812 

Epoch 8, batch 3521
Training loss: 1.7396328449249268 

Epoch 8, batch 3522
Training loss: 1.7522363662719727 

Epoch 8, batch 3523
Training loss: 1.6260294914245605 

Epoch 8, batch 3524
Training loss: 1.6269686222076416 

Epoch 8, batch 3525
Training loss: 1.8414950370788574 

Epoch 8, batch 3526
Training loss: 1.48630690574646 

Epoch 8, batch 3527
Training loss: 1.8209867477416992 

Epoch 8, batch 3528
Training loss: 1.5931117534637451 

Epoch 8, batch 3529
Training loss: 1.8169517517089844 

Epoch 8, batch 3530
Training loss: 1.8191602230072021 

Epoch 8, batch 3531
Training loss: 1.5662537813186646 

Epoch 8, batch 3532
Training loss: 1.5241954326629639 

Epoch 8, batch 3533
Training loss: 1.6996548175811768 

Epoch 8, batch 3534
Training loss: 1.7491527795791

Epoch 8, batch 3721
Training loss: 1.7612500190734863 

Epoch 8, batch 3722
Training loss: 1.854650616645813 

Epoch 8, batch 3723
Training loss: 1.8045322895050049 

Epoch 8, batch 3724
Training loss: 1.9125699996948242 

Epoch 8, batch 3725
Training loss: 1.7249469757080078 

Epoch 8, batch 3726
Training loss: 1.6639851331710815 

Epoch 8, batch 3727
Training loss: 1.6161625385284424 

Epoch 8, batch 3728
Training loss: 1.705634355545044 

Epoch 8, batch 3729
Training loss: 1.9217681884765625 

Epoch 8, batch 3730
Training loss: 1.7847429513931274 

Epoch 8, batch 3731
Training loss: 2.005455493927002 

Epoch 8, batch 3732
Training loss: 1.948287010192871 

Epoch 8, batch 3733
Training loss: 1.5111396312713623 

Epoch 8, batch 3734
Training loss: 1.6109117269515991 

Epoch 8, batch 3735
Training loss: 1.7611477375030518 

Epoch 8, batch 3736
Training loss: 1.6471199989318848 

Epoch 8, batch 3737
Training loss: 1.9560924768447876 

Epoch 8, batch 3738
Training loss: 1.680826067924499

Epoch 8, batch 3928
Training loss: 1.794747233390808 

Epoch 8, batch 3929
Training loss: 1.6414968967437744 

Epoch 8, batch 3930
Training loss: 1.4958069324493408 

Epoch 8, batch 3931
Training loss: 1.5848881006240845 

Epoch 8, batch 3932
Training loss: 1.7202911376953125 

Epoch 8, batch 3933
Training loss: 1.9129714965820312 

Epoch 8, batch 3934
Training loss: 1.6127355098724365 

Epoch 8, batch 3935
Training loss: 2.0095138549804688 

Epoch 8, batch 3936
Training loss: 1.8732714653015137 

Epoch 8, batch 3937
Training loss: 1.9457621574401855 

Epoch 8, batch 3938
Training loss: 1.9381202459335327 

Epoch 8, batch 3939
Training loss: 1.7045890092849731 

Epoch 8, batch 3940
Training loss: 1.7660870552062988 

Epoch 8, batch 3941
Training loss: 1.6934374570846558 

Epoch 8, batch 3942
Training loss: 1.6527091264724731 

Epoch 8, batch 3943
Training loss: 1.578421711921692 

Epoch 8, batch 3944
Training loss: 1.819425106048584 

Epoch 8, batch 3945
Training loss: 1.86643576622009

Epoch 8, batch 4132
Training loss: 1.8164286613464355 

Epoch 8, batch 4133
Training loss: 1.8928303718566895 

Epoch 8, batch 4134
Training loss: 1.720434546470642 

Epoch 8, batch 4135
Training loss: 1.712714672088623 

Epoch 8, batch 4136
Training loss: 1.8604304790496826 

Epoch 8, batch 4137
Training loss: 1.8808271884918213 

Epoch 8, batch 4138
Training loss: 1.99588942527771 

Epoch 8, batch 4139
Training loss: 1.7506883144378662 

Epoch 8, batch 4140
Training loss: 1.6733055114746094 

Epoch 8, batch 4141
Training loss: 1.6973994970321655 

Epoch 8, batch 4142
Training loss: 1.504852056503296 

Epoch 8, batch 4143
Training loss: 1.5857502222061157 

Epoch 8, batch 4144
Training loss: 1.6808738708496094 

Epoch 8, batch 4145
Training loss: 1.8780879974365234 

Epoch 8, batch 4146
Training loss: 1.6655340194702148 

Epoch 8, batch 4147
Training loss: 1.526975154876709 

Epoch 8, batch 4148
Training loss: 1.6294580698013306 

Epoch 8, batch 4149
Training loss: 1.6345882415771484 

Epoch 8, batch 4333
Training loss: 1.9053525924682617 

Epoch 8, batch 4334
Training loss: 2.0242621898651123 

Epoch 8, batch 4335
Training loss: 1.8034424781799316 

Epoch 8, batch 4336
Training loss: 1.9223518371582031 

Epoch 8, batch 4337
Training loss: 1.8602559566497803 

Epoch 8, batch 4338
Training loss: 1.7393776178359985 

Epoch 8, batch 4339
Training loss: 1.6709654331207275 

Epoch 8, batch 4340
Training loss: 1.8165769577026367 

Epoch 8, batch 4341
Training loss: 1.8749208450317383 

Epoch 8, batch 4342
Training loss: 1.6466057300567627 

Epoch 8, batch 4343
Training loss: 1.6574435234069824 

Epoch 8, batch 4344
Training loss: 1.4681752920150757 

Epoch 8, batch 4345
Training loss: 1.486689567565918 

Epoch 8, batch 4346
Training loss: 1.8336104154586792 

Epoch 8, batch 4347
Training loss: 1.86991286277771 

Epoch 8, batch 4348
Training loss: 1.6039464473724365 

Epoch 8, batch 4349
Training loss: 1.8544477224349976 

Epoch 8, batch 4350
Training loss: 1.51942992210388

Epoch 8, batch 4533
Training loss: 1.7332576513290405 

Epoch 8, batch 4534
Training loss: 1.8861720561981201 

Epoch 8, batch 4535
Training loss: 1.5646950006484985 

Epoch 8, batch 4536
Training loss: 1.831752061843872 

Epoch 8, batch 4537
Training loss: 1.8923256397247314 

Epoch 8, batch 4538
Training loss: 1.7466166019439697 

Epoch 8, batch 4539
Training loss: 1.5088083744049072 

Epoch 8, batch 4540
Training loss: 1.7271580696105957 

Epoch 8, batch 4541
Training loss: 1.7915277481079102 

Epoch 8, batch 4542
Training loss: 1.6925902366638184 

Epoch 8, batch 4543
Training loss: 1.7382827997207642 

Epoch 8, batch 4544
Training loss: 1.9675381183624268 

Epoch 8, batch 4545
Training loss: 1.7547136545181274 

Epoch 8, batch 4546
Training loss: 1.8378899097442627 

Epoch 8, batch 4547
Training loss: 1.5487662553787231 

Epoch 8, batch 4548
Training loss: 1.6955255270004272 

Epoch 8, batch 4549
Training loss: 1.9469115734100342 

Epoch 8, batch 4550
Training loss: 1.997950434684

Epoch 8, batch 4723
Training loss: 1.956255555152893 

Epoch 8, batch 4724
Training loss: 1.574781894683838 

Epoch 8, batch 4725
Training loss: 1.9473013877868652 

Epoch 8, batch 4726
Training loss: 1.775550365447998 

Epoch 8, batch 4727
Training loss: 1.8905868530273438 

Epoch 8, batch 4728
Training loss: 1.5168607234954834 

Epoch 8, batch 4729
Training loss: 1.9142801761627197 

Epoch 8, batch 4730
Training loss: 1.5976531505584717 

Epoch 8, batch 4731
Training loss: 1.7094717025756836 

Epoch 8, batch 4732
Training loss: 1.6818500757217407 

Epoch 8, batch 4733
Training loss: 1.8978309631347656 

Epoch 8, batch 4734
Training loss: 1.8563811779022217 

Epoch 8, batch 4735
Training loss: 1.6489397287368774 

Epoch 8, batch 4736
Training loss: 1.596517562866211 

Epoch 8, batch 4737
Training loss: 1.9799309968948364 

Epoch 8, batch 4738
Training loss: 1.6317384243011475 

Epoch 8, batch 4739
Training loss: 1.8004786968231201 

Epoch 8, batch 4740
Training loss: 1.880655646324157

Epoch 8, batch 4924
Training loss: 1.5362379550933838 

Epoch 8, batch 4925
Training loss: 1.6085063219070435 

Epoch 8, batch 4926
Training loss: 1.5009392499923706 

Epoch 8, batch 4927
Training loss: 2.004215717315674 

Epoch 8, batch 4928
Training loss: 1.9478445053100586 

Epoch 8, batch 4929
Training loss: 1.84004545211792 

Epoch 8, batch 4930
Training loss: 1.8745254278182983 

Epoch 8, batch 4931
Training loss: 1.5327228307724 

Epoch 8, batch 4932
Training loss: 1.9699069261550903 

Epoch 8, batch 4933
Training loss: 1.8215664625167847 

Epoch 8, batch 4934
Training loss: 1.6277620792388916 

Epoch 8, batch 4935
Training loss: 1.9187710285186768 

Epoch 8, batch 4936
Training loss: 1.7664906978607178 

Epoch 8, batch 4937
Training loss: 1.880859136581421 

Epoch 8, batch 4938
Training loss: 1.639428734779358 

Epoch 8, batch 4939
Training loss: 1.7118680477142334 

Epoch 8, batch 4940
Training loss: 1.5233291387557983 

Epoch 8, batch 4941
Training loss: 1.6772191524505615 



Epoch 8, batch 5123
Training loss: 1.5403416156768799 

Epoch 8, batch 5124
Training loss: 1.9602065086364746 

Epoch 8, batch 5125
Training loss: 1.6200608015060425 

Epoch 8, batch 5126
Training loss: 1.562495231628418 

Epoch 8, batch 5127
Training loss: 1.9583823680877686 

Epoch 8, batch 5128
Training loss: 1.5507892370224 

Epoch 8, batch 5129
Training loss: 1.6332082748413086 

Epoch 8, batch 5130
Training loss: 1.8587242364883423 

Epoch 8, batch 5131
Training loss: 1.5313068628311157 

Epoch 8, batch 5132
Training loss: 1.835613489151001 

Epoch 8, batch 5133
Training loss: 1.8776018619537354 

Epoch 8, batch 5134
Training loss: 1.7334606647491455 

Epoch 8, batch 5135
Training loss: 1.8338217735290527 

Epoch 8, batch 5136
Training loss: 1.6411423683166504 

Epoch 8, batch 5137
Training loss: 1.6214041709899902 

Epoch 8, batch 5138
Training loss: 1.9058244228363037 

Epoch 8, batch 5139
Training loss: 1.6932698488235474 

Epoch 8, batch 5140
Training loss: 1.6734431982040405

Epoch 8, batch 5322
Training loss: 1.7643353939056396 

Epoch 8, batch 5323
Training loss: 1.8400611877441406 

Epoch 8, batch 5324
Training loss: 1.6642158031463623 

Epoch 8, batch 5325
Training loss: 1.9008634090423584 

Epoch 8, batch 5326
Training loss: 1.8983235359191895 

Epoch 8, batch 5327
Training loss: 1.515698790550232 

Epoch 8, batch 5328
Training loss: 1.5158629417419434 

Epoch 8, batch 5329
Training loss: 1.908926248550415 

Epoch 8, batch 5330
Training loss: 1.824380874633789 

Epoch 8, batch 5331
Training loss: 1.8823555707931519 

Epoch 8, batch 5332
Training loss: 1.7745020389556885 

Epoch 8, batch 5333
Training loss: 1.8204941749572754 

Epoch 8, batch 5334
Training loss: 1.8187201023101807 

Epoch 8, batch 5335
Training loss: 1.527464747428894 

Epoch 8, batch 5336
Training loss: 1.8329885005950928 

Epoch 8, batch 5337
Training loss: 1.6708776950836182 

Epoch 8, batch 5338
Training loss: 1.7693196535110474 

Epoch 8, batch 5339
Training loss: 1.741950154304504

Epoch 8, batch 5522
Training loss: 1.5678181648254395 

Epoch 8, batch 5523
Training loss: 1.6978650093078613 

Epoch 8, batch 5524
Training loss: 1.7914588451385498 

Epoch 8, batch 5525
Training loss: 1.886269211769104 

Epoch 8, batch 5526
Training loss: 1.9052066802978516 

Epoch 8, batch 5527
Training loss: 1.5015143156051636 

Epoch 8, batch 5528
Training loss: 1.6404967308044434 

Epoch 8, batch 5529
Training loss: 1.5990028381347656 

Epoch 8, batch 5530
Training loss: 1.71955406665802 

Epoch 8, batch 5531
Training loss: 1.8882780075073242 

Epoch 8, batch 5532
Training loss: 1.894174337387085 

Epoch 8, batch 5533
Training loss: 1.5474681854248047 

Epoch 8, batch 5534
Training loss: 1.8836349248886108 

Epoch 8, batch 5535
Training loss: 1.6454777717590332 

Epoch 8, batch 5536
Training loss: 1.8566288948059082 

Epoch 8, batch 5537
Training loss: 1.7137013673782349 

Epoch 8, batch 5538
Training loss: 1.883684754371643 

Epoch 8, batch 5539
Training loss: 1.6669964790344238

Epoch 8, batch 5716
Training loss: 1.5242245197296143 

Epoch 8, batch 5717
Training loss: 1.6447474956512451 

Epoch 8, batch 5718
Training loss: 1.8233407735824585 

Epoch 8, batch 5719
Training loss: 1.5707776546478271 

Epoch 8, batch 5720
Training loss: 1.5334964990615845 

Epoch 8, batch 5721
Training loss: 1.553737998008728 

Epoch 8, batch 5722
Training loss: 1.8540875911712646 

Epoch 8, batch 5723
Training loss: 1.4935634136199951 

Epoch 8, batch 5724
Training loss: 1.5388052463531494 

Epoch 8, batch 5725
Training loss: 1.6807796955108643 

Epoch 8, batch 5726
Training loss: 1.5258581638336182 

Epoch 8, batch 5727
Training loss: 1.916823148727417 

Epoch 8, batch 5728
Training loss: 1.7966264486312866 

Epoch 8, batch 5729
Training loss: 1.865954875946045 

Epoch 8, batch 5730
Training loss: 1.6094584465026855 

Epoch 8, batch 5731
Training loss: 1.5679411888122559 

Epoch 8, batch 5732
Training loss: 1.8318673372268677 

Epoch 8, batch 5733
Training loss: 1.74200546741485

Epoch 8, batch 5910
Training loss: 1.4790219068527222 

Epoch 8, batch 5911
Training loss: 1.5620691776275635 

Epoch 8, batch 5912
Training loss: 1.9209895133972168 

Epoch 8, batch 5913
Training loss: 1.7558445930480957 

Epoch 8, batch 5914
Training loss: 1.808875560760498 

Epoch 8, batch 5915
Training loss: 1.7486326694488525 

Epoch 8, batch 5916
Training loss: 1.6238442659378052 

Epoch 8, batch 5917
Training loss: 1.9255192279815674 

Epoch 8, batch 5918
Training loss: 1.462700366973877 

Epoch 8, batch 5919
Training loss: 1.6076366901397705 

Epoch 8, batch 5920
Training loss: 1.5835590362548828 

Epoch 8, batch 5921
Training loss: 1.7951467037200928 

Epoch 8, batch 5922
Training loss: 1.6659866571426392 

Epoch 8, batch 5923
Training loss: 1.5457748174667358 

Epoch 8, batch 5924
Training loss: 1.7807236909866333 

Epoch 8, batch 5925
Training loss: 1.6320528984069824 

Epoch 8, batch 5926
Training loss: 1.5928431749343872 

Epoch 8, batch 5927
Training loss: 1.7966358661651

Epoch 9, batch 108
Training loss: 1.4669888019561768 

Epoch 9, batch 109
Training loss: 1.6131092309951782 

Epoch 9, batch 110
Training loss: 1.832777500152588 

Epoch 9, batch 111
Training loss: 1.860707402229309 

Epoch 9, batch 112
Training loss: 1.5688611268997192 

Epoch 9, batch 113
Training loss: 1.539431095123291 

Epoch 9, batch 114
Training loss: 1.639439344406128 

Epoch 9, batch 115
Training loss: 1.6179951429367065 

Epoch 9, batch 116
Training loss: 1.5346181392669678 

Epoch 9, batch 117
Training loss: 2.055492639541626 

Epoch 9, batch 118
Training loss: 1.8140177726745605 

Epoch 9, batch 119
Training loss: 1.7983434200286865 

Epoch 9, batch 120
Training loss: 1.6543145179748535 

Epoch 9, batch 121
Training loss: 1.5959782600402832 

Epoch 9, batch 122
Training loss: 1.9380216598510742 

Epoch 9, batch 123
Training loss: 1.6846349239349365 

Epoch 9, batch 124
Training loss: 1.614173173904419 

Epoch 9, batch 125
Training loss: 1.8645298480987549 

Epoch 9, batch 1

Epoch 9, batch 310
Training loss: 1.9862080812454224 

Epoch 9, batch 311
Training loss: 1.7800824642181396 

Epoch 9, batch 312
Training loss: 2.002601146697998 

Epoch 9, batch 313
Training loss: 1.8970229625701904 

Epoch 9, batch 314
Training loss: 1.9415786266326904 

Epoch 9, batch 315
Training loss: 1.6114338636398315 

Epoch 9, batch 316
Training loss: 1.559281349182129 

Epoch 9, batch 317
Training loss: 1.5774949789047241 

Epoch 9, batch 318
Training loss: 1.629608392715454 

Epoch 9, batch 319
Training loss: 1.9633516073226929 

Epoch 9, batch 320
Training loss: 1.9589465856552124 

Epoch 9, batch 321
Training loss: 1.7426095008850098 

Epoch 9, batch 322
Training loss: 1.6237212419509888 

Epoch 9, batch 323
Training loss: 1.7004222869873047 

Epoch 9, batch 324
Training loss: 1.543874740600586 

Epoch 9, batch 325
Training loss: 1.5857207775115967 

Epoch 9, batch 326
Training loss: 1.6200709342956543 

Epoch 9, batch 327
Training loss: 1.5299577713012695 

Epoch 9, batch

Epoch 9, batch 511
Training loss: 1.5983519554138184 

Epoch 9, batch 512
Training loss: 1.570802927017212 

Epoch 9, batch 513
Training loss: 1.904353380203247 

Epoch 9, batch 514
Training loss: 1.6583975553512573 

Epoch 9, batch 515
Training loss: 2.063906669616699 

Epoch 9, batch 516
Training loss: 1.7374906539916992 

Epoch 9, batch 517
Training loss: 1.813528299331665 

Epoch 9, batch 518
Training loss: 1.604907751083374 

Epoch 9, batch 519
Training loss: 1.9599120616912842 

Epoch 9, batch 520
Training loss: 1.7796412706375122 

Epoch 9, batch 521
Training loss: 1.624957799911499 

Epoch 9, batch 522
Training loss: 1.8698899745941162 

Epoch 9, batch 523
Training loss: 1.940980076789856 

Epoch 9, batch 524
Training loss: 1.7710206508636475 

Epoch 9, batch 525
Training loss: 1.8068654537200928 

Epoch 9, batch 526
Training loss: 1.6066057682037354 

Epoch 9, batch 527
Training loss: 1.8205019235610962 

Epoch 9, batch 528
Training loss: 1.6687648296356201 

Epoch 9, batch 52

Epoch 9, batch 712
Training loss: 1.9853148460388184 

Epoch 9, batch 713
Training loss: 1.667807936668396 

Epoch 9, batch 714
Training loss: 1.7527532577514648 

Epoch 9, batch 715
Training loss: 1.6020804643630981 

Epoch 9, batch 716
Training loss: 1.728327751159668 

Epoch 9, batch 717
Training loss: 1.4994447231292725 

Epoch 9, batch 718
Training loss: 1.634757161140442 

Epoch 9, batch 719
Training loss: 1.5972034931182861 

Epoch 9, batch 720
Training loss: 1.6256104707717896 

Epoch 9, batch 721
Training loss: 1.9249215126037598 

Epoch 9, batch 722
Training loss: 1.7037086486816406 

Epoch 9, batch 723
Training loss: 1.7549291849136353 

Epoch 9, batch 724
Training loss: 1.7200393676757812 

Epoch 9, batch 725
Training loss: 1.8090429306030273 

Epoch 9, batch 726
Training loss: 1.7883808612823486 

Epoch 9, batch 727
Training loss: 1.8079818487167358 

Epoch 9, batch 728
Training loss: 1.643821358680725 

Epoch 9, batch 729
Training loss: 1.659562110900879 

Epoch 9, batch 

Epoch 9, batch 914
Training loss: 1.5359212160110474 

Epoch 9, batch 915
Training loss: 1.5816168785095215 

Epoch 9, batch 916
Training loss: 1.7807555198669434 

Epoch 9, batch 917
Training loss: 1.655556321144104 

Epoch 9, batch 918
Training loss: 1.6106797456741333 

Epoch 9, batch 919
Training loss: 1.693074345588684 

Epoch 9, batch 920
Training loss: 1.9007456302642822 

Epoch 9, batch 921
Training loss: 2.002486228942871 

Epoch 9, batch 922
Training loss: 1.9468815326690674 

Epoch 9, batch 923
Training loss: 1.563086748123169 

Epoch 9, batch 924
Training loss: 1.6413379907608032 

Epoch 9, batch 925
Training loss: 1.7429733276367188 

Epoch 9, batch 926
Training loss: 1.63821542263031 

Epoch 9, batch 927
Training loss: 1.5258445739746094 

Epoch 9, batch 928
Training loss: 1.9488245248794556 

Epoch 9, batch 929
Training loss: 1.6504017114639282 

Epoch 9, batch 930
Training loss: 1.711942434310913 

Epoch 9, batch 931
Training loss: 1.7658449411392212 

Epoch 9, batch 93

Epoch 9, batch 1117
Training loss: 1.7886370420455933 

Epoch 9, batch 1118
Training loss: 1.6247023344039917 

Epoch 9, batch 1119
Training loss: 1.7180428504943848 

Epoch 9, batch 1120
Training loss: 1.5139654874801636 

Epoch 9, batch 1121
Training loss: 1.6692829132080078 

Epoch 9, batch 1122
Training loss: 1.9257761240005493 

Epoch 9, batch 1123
Training loss: 1.663210391998291 

Epoch 9, batch 1124
Training loss: 1.710269808769226 

Epoch 9, batch 1125
Training loss: 1.5056614875793457 

Epoch 9, batch 1126
Training loss: 1.7824897766113281 

Epoch 9, batch 1127
Training loss: 1.634635090827942 

Epoch 9, batch 1128
Training loss: 1.7671386003494263 

Epoch 9, batch 1129
Training loss: 1.7373969554901123 

Epoch 9, batch 1130
Training loss: 1.7690119743347168 

Epoch 9, batch 1131
Training loss: 1.9833788871765137 

Epoch 9, batch 1132
Training loss: 1.7112597227096558 

Epoch 9, batch 1133
Training loss: 1.9244914054870605 

Epoch 9, batch 1134
Training loss: 1.71943604946136

Epoch 9, batch 1320
Training loss: 1.8418267965316772 

Epoch 9, batch 1321
Training loss: 1.504219651222229 

Epoch 9, batch 1322
Training loss: 1.7971217632293701 

Epoch 9, batch 1323
Training loss: 1.9205782413482666 

Epoch 9, batch 1324
Training loss: 1.6388756036758423 

Epoch 9, batch 1325
Training loss: 1.9975650310516357 

Epoch 9, batch 1326
Training loss: 1.4989304542541504 

Epoch 9, batch 1327
Training loss: 1.901912808418274 

Epoch 9, batch 1328
Training loss: 1.90421724319458 

Epoch 9, batch 1329
Training loss: 1.7559313774108887 

Epoch 9, batch 1330
Training loss: 1.8582348823547363 

Epoch 9, batch 1331
Training loss: 1.6615197658538818 

Epoch 9, batch 1332
Training loss: 1.6963379383087158 

Epoch 9, batch 1333
Training loss: 1.5761266946792603 

Epoch 9, batch 1334
Training loss: 1.9299919605255127 

Epoch 9, batch 1335
Training loss: 1.6328516006469727 

Epoch 9, batch 1336
Training loss: 1.8293125629425049 

Epoch 9, batch 1337
Training loss: 1.644451141357421

Epoch 9, batch 1525
Training loss: 1.709075927734375 

Epoch 9, batch 1526
Training loss: 1.7975273132324219 

Epoch 9, batch 1527
Training loss: 1.5851023197174072 

Epoch 9, batch 1528
Training loss: 1.5098350048065186 

Epoch 9, batch 1529
Training loss: 1.6804962158203125 

Epoch 9, batch 1530
Training loss: 1.7617723941802979 

Epoch 9, batch 1531
Training loss: 1.6390323638916016 

Epoch 9, batch 1532
Training loss: 1.741974115371704 

Epoch 9, batch 1533
Training loss: 1.6088236570358276 

Epoch 9, batch 1534
Training loss: 2.022871494293213 

Epoch 9, batch 1535
Training loss: 1.5944867134094238 

Epoch 9, batch 1536
Training loss: 1.801180362701416 

Epoch 9, batch 1537
Training loss: 1.6584084033966064 

Epoch 9, batch 1538
Training loss: 2.018449544906616 

Epoch 9, batch 1539
Training loss: 1.6027286052703857 

Epoch 9, batch 1540
Training loss: 1.8678092956542969 

Epoch 9, batch 1541
Training loss: 1.6591336727142334 

Epoch 9, batch 1542
Training loss: 1.687047004699707 

Epoch 9, batch 1729
Training loss: 1.4650003910064697 

Epoch 9, batch 1730
Training loss: 1.586011528968811 

Epoch 9, batch 1731
Training loss: 2.030336380004883 

Epoch 9, batch 1732
Training loss: 1.93581223487854 

Epoch 9, batch 1733
Training loss: 1.5009806156158447 

Epoch 9, batch 1734
Training loss: 1.6159498691558838 

Epoch 9, batch 1735
Training loss: 1.5857471227645874 

Epoch 9, batch 1736
Training loss: 1.591139793395996 

Epoch 9, batch 1737
Training loss: 1.551192045211792 

Epoch 9, batch 1738
Training loss: 2.007768154144287 

Epoch 9, batch 1739
Training loss: 1.978100299835205 

Epoch 9, batch 1740
Training loss: 1.8364814519882202 

Epoch 9, batch 1741
Training loss: 1.8086209297180176 

Epoch 9, batch 1742
Training loss: 1.6559079885482788 

Epoch 9, batch 1743
Training loss: 1.8356640338897705 

Epoch 9, batch 1744
Training loss: 1.7437608242034912 

Epoch 9, batch 1745
Training loss: 1.505718469619751 

Epoch 9, batch 1746
Training loss: 1.720644235610962 

Ep

Epoch 9, batch 1931
Training loss: 1.9097344875335693 

Epoch 9, batch 1932
Training loss: 1.8044432401657104 

Epoch 9, batch 1933
Training loss: 1.7252044677734375 

Epoch 9, batch 1934
Training loss: 1.7184494733810425 

Epoch 9, batch 1935
Training loss: 1.6936824321746826 

Epoch 9, batch 1936
Training loss: 1.8172531127929688 

Epoch 9, batch 1937
Training loss: 1.8094358444213867 

Epoch 9, batch 1938
Training loss: 1.6079503297805786 

Epoch 9, batch 1939
Training loss: 1.6766525506973267 

Epoch 9, batch 1940
Training loss: 1.7416502237319946 

Epoch 9, batch 1941
Training loss: 1.7850333452224731 

Epoch 9, batch 1942
Training loss: 1.4872841835021973 

Epoch 9, batch 1943
Training loss: 1.9338830709457397 

Epoch 9, batch 1944
Training loss: 1.5637927055358887 

Epoch 9, batch 1945
Training loss: 1.9695438146591187 

Epoch 9, batch 1946
Training loss: 1.6226602792739868 

Epoch 9, batch 1947
Training loss: 1.889866828918457 

Epoch 9, batch 1948
Training loss: 1.677191257476

Epoch 9, batch 2134
Training loss: 1.6874608993530273 

Epoch 9, batch 2135
Training loss: 1.7362654209136963 

Epoch 9, batch 2136
Training loss: 1.8149986267089844 

Epoch 9, batch 2137
Training loss: 1.8293628692626953 

Epoch 9, batch 2138
Training loss: 1.702710747718811 

Epoch 9, batch 2139
Training loss: 1.7451145648956299 

Epoch 9, batch 2140
Training loss: 1.5672993659973145 

Epoch 9, batch 2141
Training loss: 2.036484718322754 

Epoch 9, batch 2142
Training loss: 1.7772815227508545 

Epoch 9, batch 2143
Training loss: 1.5703704357147217 

Epoch 9, batch 2144
Training loss: 1.7202099561691284 

Epoch 9, batch 2145
Training loss: 2.026379346847534 

Epoch 9, batch 2146
Training loss: 1.8713874816894531 

Epoch 9, batch 2147
Training loss: 1.8384073972702026 

Epoch 9, batch 2148
Training loss: 1.8727307319641113 

Epoch 9, batch 2149
Training loss: 1.6150966882705688 

Epoch 9, batch 2150
Training loss: 1.8684308528900146 

Epoch 9, batch 2151
Training loss: 1.74138569831848

Epoch 9, batch 2338
Training loss: 1.5237255096435547 

Epoch 9, batch 2339
Training loss: 1.5673511028289795 

Epoch 9, batch 2340
Training loss: 1.9937841892242432 

Epoch 9, batch 2341
Training loss: 1.6588510274887085 

Epoch 9, batch 2342
Training loss: 1.7819448709487915 

Epoch 9, batch 2343
Training loss: 1.7485144138336182 

Epoch 9, batch 2344
Training loss: 1.4721620082855225 

Epoch 9, batch 2345
Training loss: 1.6014074087142944 

Epoch 9, batch 2346
Training loss: 1.9528182744979858 

Epoch 9, batch 2347
Training loss: 1.5826200246810913 

Epoch 9, batch 2348
Training loss: 1.548835277557373 

Epoch 9, batch 2349
Training loss: 1.8611361980438232 

Epoch 9, batch 2350
Training loss: 2.0115532875061035 

Epoch 9, batch 2351
Training loss: 1.6806132793426514 

Epoch 9, batch 2352
Training loss: 1.9321579933166504 

Epoch 9, batch 2353
Training loss: 1.6602017879486084 

Epoch 9, batch 2354
Training loss: 1.5283000469207764 

Epoch 9, batch 2355
Training loss: 1.705144762992

Epoch 9, batch 2541
Training loss: 1.646188735961914 

Epoch 9, batch 2542
Training loss: 1.874979019165039 

Epoch 9, batch 2543
Training loss: 1.9246821403503418 

Epoch 9, batch 2544
Training loss: 1.7991900444030762 

Epoch 9, batch 2545
Training loss: 1.7821457386016846 

Epoch 9, batch 2546
Training loss: 1.842821717262268 

Epoch 9, batch 2547
Training loss: 1.6247544288635254 

Epoch 9, batch 2548
Training loss: 1.6855591535568237 

Epoch 9, batch 2549
Training loss: 1.7758151292800903 

Epoch 9, batch 2550
Training loss: 1.6795703172683716 

Epoch 9, batch 2551
Training loss: 1.7968662977218628 

Epoch 9, batch 2552
Training loss: 1.6660698652267456 

Epoch 9, batch 2553
Training loss: 1.6865482330322266 

Epoch 9, batch 2554
Training loss: 1.5612192153930664 

Epoch 9, batch 2555
Training loss: 1.5200738906860352 

Epoch 9, batch 2556
Training loss: 1.7608314752578735 

Epoch 9, batch 2557
Training loss: 1.9676754474639893 

Epoch 9, batch 2558
Training loss: 1.78036916255950

Epoch 9, batch 2741
Training loss: 1.5475170612335205 

Epoch 9, batch 2742
Training loss: 1.6117674112319946 

Epoch 9, batch 2743
Training loss: 2.0046472549438477 

Epoch 9, batch 2744
Training loss: 1.6133720874786377 

Epoch 9, batch 2745
Training loss: 1.6950169801712036 

Epoch 9, batch 2746
Training loss: 1.46863853931427 

Epoch 9, batch 2747
Training loss: 1.636246681213379 

Epoch 9, batch 2748
Training loss: 1.9600383043289185 

Epoch 9, batch 2749
Training loss: 1.8242771625518799 

Epoch 9, batch 2750
Training loss: 1.7416834831237793 

Epoch 9, batch 2751
Training loss: 1.7996492385864258 

Epoch 9, batch 2752
Training loss: 1.5745208263397217 

Epoch 9, batch 2753
Training loss: 1.4989458322525024 

Epoch 9, batch 2754
Training loss: 1.8537976741790771 

Epoch 9, batch 2755
Training loss: 1.7794697284698486 

Epoch 9, batch 2756
Training loss: 1.814305067062378 

Epoch 9, batch 2757
Training loss: 1.6981089115142822 

Epoch 9, batch 2758
Training loss: 1.585105657577514

Epoch 9, batch 2942
Training loss: 1.621201515197754 

Epoch 9, batch 2943
Training loss: 1.5285450220108032 

Epoch 9, batch 2944
Training loss: 1.8138906955718994 

Epoch 9, batch 2945
Training loss: 1.8438338041305542 

Epoch 9, batch 2946
Training loss: 1.9047110080718994 

Epoch 9, batch 2947
Training loss: 1.8496884107589722 

Epoch 9, batch 2948
Training loss: 1.6855785846710205 

Epoch 9, batch 2949
Training loss: 1.7276750802993774 

Epoch 9, batch 2950
Training loss: 1.4692445993423462 

Epoch 9, batch 2951
Training loss: 1.6848747730255127 

Epoch 9, batch 2952
Training loss: 1.8025472164154053 

Epoch 9, batch 2953
Training loss: 1.8159096240997314 

Epoch 9, batch 2954
Training loss: 1.8114166259765625 

Epoch 9, batch 2955
Training loss: 1.8620452880859375 

Epoch 9, batch 2956
Training loss: 1.8703430891036987 

Epoch 9, batch 2957
Training loss: 1.605146050453186 

Epoch 9, batch 2958
Training loss: 1.6352359056472778 

Epoch 9, batch 2959
Training loss: 1.7270380258560

Epoch 9, batch 3148
Training loss: 1.9166136980056763 

Epoch 9, batch 3149
Training loss: 1.9102414846420288 

Epoch 9, batch 3150
Training loss: 1.5806777477264404 

Epoch 9, batch 3151
Training loss: 1.8358705043792725 

Epoch 9, batch 3152
Training loss: 1.9722881317138672 

Epoch 9, batch 3153
Training loss: 1.9208890199661255 

Epoch 9, batch 3154
Training loss: 1.8599255084991455 

Epoch 9, batch 3155
Training loss: 1.6613163948059082 

Epoch 9, batch 3156
Training loss: 1.8797471523284912 

Epoch 9, batch 3157
Training loss: 1.5553514957427979 

Epoch 9, batch 3158
Training loss: 1.618734359741211 

Epoch 9, batch 3159
Training loss: 1.9311132431030273 

Epoch 9, batch 3160
Training loss: 1.7145856618881226 

Epoch 9, batch 3161
Training loss: 1.8306962251663208 

Epoch 9, batch 3162
Training loss: 1.9079625606536865 

Epoch 9, batch 3163
Training loss: 1.86809504032135 

Epoch 9, batch 3164
Training loss: 1.7018558979034424 

Epoch 9, batch 3165
Training loss: 1.97623181343078

Epoch 9, batch 3350
Training loss: 1.684132695198059 

Epoch 9, batch 3351
Training loss: 1.6331853866577148 

Epoch 9, batch 3352
Training loss: 1.680622935295105 

Epoch 9, batch 3353
Training loss: 1.6477437019348145 

Epoch 9, batch 3354
Training loss: 1.480839729309082 

Epoch 9, batch 3355
Training loss: 1.9151942729949951 

Epoch 9, batch 3356
Training loss: 1.5987563133239746 

Epoch 9, batch 3357
Training loss: 1.5039188861846924 

Epoch 9, batch 3358
Training loss: 1.5236912965774536 

Epoch 9, batch 3359
Training loss: 1.681039571762085 

Epoch 9, batch 3360
Training loss: 1.6100142002105713 

Epoch 9, batch 3361
Training loss: 1.7558457851409912 

Epoch 9, batch 3362
Training loss: 1.6684527397155762 

Epoch 9, batch 3363
Training loss: 1.4726879596710205 

Epoch 9, batch 3364
Training loss: 1.9441187381744385 

Epoch 9, batch 3365
Training loss: 1.852104902267456 

Epoch 9, batch 3366
Training loss: 1.7664453983306885 

Epoch 9, batch 3367
Training loss: 1.7026546001434326

Epoch 9, batch 3552
Training loss: 1.6145172119140625 

Epoch 9, batch 3553
Training loss: 1.5749640464782715 

Epoch 9, batch 3554
Training loss: 1.743128776550293 

Epoch 9, batch 3555
Training loss: 1.568669319152832 

Epoch 9, batch 3556
Training loss: 1.846963882446289 

Epoch 9, batch 3557
Training loss: 1.7508116960525513 

Epoch 9, batch 3558
Training loss: 1.7877311706542969 

Epoch 9, batch 3559
Training loss: 1.5508244037628174 

Epoch 9, batch 3560
Training loss: 1.5065687894821167 

Epoch 9, batch 3561
Training loss: 1.8538541793823242 

Epoch 9, batch 3562
Training loss: 1.795440435409546 

Epoch 9, batch 3563
Training loss: 1.855135202407837 

Epoch 9, batch 3564
Training loss: 1.734283208847046 

Epoch 9, batch 3565
Training loss: 1.7971320152282715 

Epoch 9, batch 3566
Training loss: 1.677761197090149 

Epoch 9, batch 3567
Training loss: 1.6219815015792847 

Epoch 9, batch 3568
Training loss: 1.940702199935913 

Epoch 9, batch 3569
Training loss: 1.7551000118255615 



Epoch 9, batch 3754
Training loss: 1.8336800336837769 

Epoch 9, batch 3755
Training loss: 1.8167879581451416 

Epoch 9, batch 3756
Training loss: 1.5819432735443115 

Epoch 9, batch 3757
Training loss: 1.8200159072875977 

Epoch 9, batch 3758
Training loss: 1.6082898378372192 

Epoch 9, batch 3759
Training loss: 1.5991010665893555 

Epoch 9, batch 3760
Training loss: 1.5507301092147827 

Epoch 9, batch 3761
Training loss: 1.8268613815307617 

Epoch 9, batch 3762
Training loss: 1.515769600868225 

Epoch 9, batch 3763
Training loss: 1.8632197380065918 

Epoch 9, batch 3764
Training loss: 1.7457489967346191 

Epoch 9, batch 3765
Training loss: 1.8843849897384644 

Epoch 9, batch 3766
Training loss: 1.7712063789367676 

Epoch 9, batch 3767
Training loss: 1.7789348363876343 

Epoch 9, batch 3768
Training loss: 1.844231367111206 

Epoch 9, batch 3769
Training loss: 1.5759447813034058 

Epoch 9, batch 3770
Training loss: 1.8071805238723755 

Epoch 9, batch 3771
Training loss: 1.5402718782424

Epoch 9, batch 3955
Training loss: 1.4886404275894165 

Epoch 9, batch 3956
Training loss: 1.6480181217193604 

Epoch 9, batch 3957
Training loss: 1.706407904624939 

Epoch 9, batch 3958
Training loss: 1.4771865606307983 

Epoch 9, batch 3959
Training loss: 1.5937196016311646 

Epoch 9, batch 3960
Training loss: 1.8334184885025024 

Epoch 9, batch 3961
Training loss: 1.6202001571655273 

Epoch 9, batch 3962
Training loss: 1.8292557001113892 

Epoch 9, batch 3963
Training loss: 1.7114404439926147 

Epoch 9, batch 3964
Training loss: 1.825710415840149 

Epoch 9, batch 3965
Training loss: 1.779097557067871 

Epoch 9, batch 3966
Training loss: 1.9338445663452148 

Epoch 9, batch 3967
Training loss: 1.7005712985992432 

Epoch 9, batch 3968
Training loss: 1.769871473312378 

Epoch 9, batch 3969
Training loss: 1.4972302913665771 

Epoch 9, batch 3970
Training loss: 1.8071045875549316 

Epoch 9, batch 3971
Training loss: 1.7124621868133545 

Epoch 9, batch 3972
Training loss: 1.739763498306274

Epoch 9, batch 4160
Training loss: 1.506564736366272 

Epoch 9, batch 4161
Training loss: 1.716083288192749 

Epoch 9, batch 4162
Training loss: 1.6269285678863525 

Epoch 9, batch 4163
Training loss: 1.7895491123199463 

Epoch 9, batch 4164
Training loss: 1.6951290369033813 

Epoch 9, batch 4165
Training loss: 1.8037114143371582 

Epoch 9, batch 4166
Training loss: 1.779076099395752 

Epoch 9, batch 4167
Training loss: 1.9461809396743774 

Epoch 9, batch 4168
Training loss: 1.7893707752227783 

Epoch 9, batch 4169
Training loss: 1.5852174758911133 

Epoch 9, batch 4170
Training loss: 1.70441472530365 

Epoch 9, batch 4171
Training loss: 1.7689945697784424 

Epoch 9, batch 4172
Training loss: 1.6860840320587158 

Epoch 9, batch 4173
Training loss: 1.6058809757232666 

Epoch 9, batch 4174
Training loss: 1.806140422821045 

Epoch 9, batch 4175
Training loss: 1.5513198375701904 

Epoch 9, batch 4176
Training loss: 1.6572717428207397 

Epoch 9, batch 4177
Training loss: 1.9805469512939453 

Epoch 9, batch 4363
Training loss: 1.6349356174468994 

Epoch 9, batch 4364
Training loss: 1.4935328960418701 

Epoch 9, batch 4365
Training loss: 1.8985073566436768 

Epoch 9, batch 4366
Training loss: 1.5593137741088867 

Epoch 9, batch 4367
Training loss: 1.5675504207611084 

Epoch 9, batch 4368
Training loss: 1.6533055305480957 

Epoch 9, batch 4369
Training loss: 1.8356354236602783 

Epoch 9, batch 4370
Training loss: 1.7735885381698608 

Epoch 9, batch 4371
Training loss: 1.6155664920806885 

Epoch 9, batch 4372
Training loss: 1.926703929901123 

Epoch 9, batch 4373
Training loss: 1.7054451704025269 

Epoch 9, batch 4374
Training loss: 1.9713850021362305 

Epoch 9, batch 4375
Training loss: 1.4944279193878174 

Epoch 9, batch 4376
Training loss: 1.6235460042953491 

Epoch 9, batch 4377
Training loss: 1.587001919746399 

Epoch 9, batch 4378
Training loss: 1.6225111484527588 

Epoch 9, batch 4379
Training loss: 1.6235485076904297 

Epoch 9, batch 4380
Training loss: 1.9029967784881

Epoch 9, batch 4568
Training loss: 1.817121148109436 

Epoch 9, batch 4569
Training loss: 2.0155622959136963 

Epoch 9, batch 4570
Training loss: 1.8203802108764648 

Epoch 9, batch 4571
Training loss: 1.5034412145614624 

Epoch 9, batch 4572
Training loss: 1.7616798877716064 

Epoch 9, batch 4573
Training loss: 1.6534641981124878 

Epoch 9, batch 4574
Training loss: 1.5058128833770752 

Epoch 9, batch 4575
Training loss: 1.8057337999343872 

Epoch 9, batch 4576
Training loss: 1.7550867795944214 

Epoch 9, batch 4577
Training loss: 2.0486154556274414 

Epoch 9, batch 4578
Training loss: 1.6103439331054688 

Epoch 9, batch 4579
Training loss: 1.7085782289505005 

Epoch 9, batch 4580
Training loss: 1.8733980655670166 

Epoch 9, batch 4581
Training loss: 1.7340190410614014 

Epoch 9, batch 4582
Training loss: 1.538107991218567 

Epoch 9, batch 4583
Training loss: 1.739023208618164 

Epoch 9, batch 4584
Training loss: 1.770535945892334 

Epoch 9, batch 4585
Training loss: 1.780732154846191

Epoch 9, batch 4773
Training loss: 1.5442278385162354 

Epoch 9, batch 4774
Training loss: 1.857080101966858 

Epoch 9, batch 4775
Training loss: 1.8297991752624512 

Epoch 9, batch 4776
Training loss: 1.761234998703003 

Epoch 9, batch 4777
Training loss: 1.918550968170166 

Epoch 9, batch 4778
Training loss: 1.6238406896591187 

Epoch 9, batch 4779
Training loss: 1.6958274841308594 

Epoch 9, batch 4780
Training loss: 1.9535901546478271 

Epoch 9, batch 4781
Training loss: 1.8243238925933838 

Epoch 9, batch 4782
Training loss: 1.713355302810669 

Epoch 9, batch 4783
Training loss: 1.738757610321045 

Epoch 9, batch 4784
Training loss: 1.9082088470458984 

Epoch 9, batch 4785
Training loss: 1.7994922399520874 

Epoch 9, batch 4786
Training loss: 1.7937781810760498 

Epoch 9, batch 4787
Training loss: 1.722071886062622 

Epoch 9, batch 4788
Training loss: 1.936389684677124 

Epoch 9, batch 4789
Training loss: 1.8466417789459229 

Epoch 9, batch 4790
Training loss: 1.5396493673324585 


Epoch 9, batch 4977
Training loss: 1.4859187602996826 

Epoch 9, batch 4978
Training loss: 1.5628167390823364 

Epoch 9, batch 4979
Training loss: 1.7291866540908813 

Epoch 9, batch 4980
Training loss: 1.531195044517517 

Epoch 9, batch 4981
Training loss: 1.954761266708374 

Epoch 9, batch 4982
Training loss: 1.547329306602478 

Epoch 9, batch 4983
Training loss: 1.846543788909912 

Epoch 9, batch 4984
Training loss: 1.7174901962280273 

Epoch 9, batch 4985
Training loss: 1.5113972425460815 

Epoch 9, batch 4986
Training loss: 1.5412817001342773 

Epoch 9, batch 4987
Training loss: 1.8254340887069702 

Epoch 9, batch 4988
Training loss: 1.859704852104187 

Epoch 9, batch 4989
Training loss: 1.9870727062225342 

Epoch 9, batch 4990
Training loss: 1.9186789989471436 

Epoch 9, batch 4991
Training loss: 1.6992896795272827 

Epoch 9, batch 4992
Training loss: 2.060483455657959 

Epoch 9, batch 4993
Training loss: 1.9198229312896729 

Epoch 9, batch 4994
Training loss: 1.9604700803756714 

Epoch 9, batch 5182
Training loss: 1.545768141746521 

Epoch 9, batch 5183
Training loss: 1.861588716506958 

Epoch 9, batch 5184
Training loss: 1.5564604997634888 

Epoch 9, batch 5185
Training loss: 1.7940806150436401 

Epoch 9, batch 5186
Training loss: 1.5954594612121582 

Epoch 9, batch 5187
Training loss: 1.8702497482299805 

Epoch 9, batch 5188
Training loss: 1.557971715927124 

Epoch 9, batch 5189
Training loss: 1.6836299896240234 

Epoch 9, batch 5190
Training loss: 1.8691298961639404 

Epoch 9, batch 5191
Training loss: 1.9251632690429688 

Epoch 9, batch 5192
Training loss: 1.8054862022399902 

Epoch 9, batch 5193
Training loss: 1.5684970617294312 

Epoch 9, batch 5194
Training loss: 1.819901943206787 

Epoch 9, batch 5195
Training loss: 1.7985023260116577 

Epoch 9, batch 5196
Training loss: 1.5620009899139404 

Epoch 9, batch 5197
Training loss: 1.9282207489013672 

Epoch 9, batch 5198
Training loss: 1.7790555953979492 

Epoch 9, batch 5199
Training loss: 1.756779432296753

Epoch 9, batch 5384
Training loss: 1.956769585609436 

Epoch 9, batch 5385
Training loss: 2.0939414501190186 

Epoch 9, batch 5386
Training loss: 1.9547303915023804 

Epoch 9, batch 5387
Training loss: 1.9601757526397705 

Epoch 9, batch 5388
Training loss: 1.6901466846466064 

Epoch 9, batch 5389
Training loss: 1.6527342796325684 

Epoch 9, batch 5390
Training loss: 1.9500483274459839 

Epoch 9, batch 5391
Training loss: 1.7831250429153442 

Epoch 9, batch 5392
Training loss: 1.5022364854812622 

Epoch 9, batch 5393
Training loss: 1.7144496440887451 

Epoch 9, batch 5394
Training loss: 1.6709911823272705 

Epoch 9, batch 5395
Training loss: 1.5562810897827148 

Epoch 9, batch 5396
Training loss: 1.5458483695983887 

Epoch 9, batch 5397
Training loss: 1.8610846996307373 

Epoch 9, batch 5398
Training loss: 1.5072972774505615 

Epoch 9, batch 5399
Training loss: 1.900560736656189 

Epoch 9, batch 5400
Training loss: 1.7014267444610596 

Epoch 9, batch 5401
Training loss: 1.7053971290588

Epoch 9, batch 5577
Training loss: 1.6433130502700806 

Epoch 9, batch 5578
Training loss: 1.705137014389038 

Epoch 9, batch 5579
Training loss: 1.7151198387145996 

Epoch 9, batch 5580
Training loss: 1.6363186836242676 

Epoch 9, batch 5581
Training loss: 1.5432953834533691 

Epoch 9, batch 5582
Training loss: 1.7369509935379028 

Epoch 9, batch 5583
Training loss: 2.0100185871124268 

Epoch 9, batch 5584
Training loss: 1.9247043132781982 

Epoch 9, batch 5585
Training loss: 1.9612908363342285 

Epoch 9, batch 5586
Training loss: 1.653045654296875 

Epoch 9, batch 5587
Training loss: 1.7878497838974 

Epoch 9, batch 5588
Training loss: 1.7839722633361816 

Epoch 9, batch 5589
Training loss: 1.907343864440918 

Epoch 9, batch 5590
Training loss: 1.9609010219573975 

Epoch 9, batch 5591
Training loss: 1.84506094455719 

Epoch 9, batch 5592
Training loss: 1.57017982006073 

Epoch 9, batch 5593
Training loss: 1.6272567510604858 

Epoch 9, batch 5594
Training loss: 1.8266998529434204 

Ep

Epoch 9, batch 5783
Training loss: 1.799643635749817 

Epoch 9, batch 5784
Training loss: 1.7718088626861572 

Epoch 9, batch 5785
Training loss: 1.8523128032684326 

Epoch 9, batch 5786
Training loss: 1.6510770320892334 

Epoch 9, batch 5787
Training loss: 1.6743924617767334 

Epoch 9, batch 5788
Training loss: 1.6927140951156616 

Epoch 9, batch 5789
Training loss: 1.764780879020691 

Epoch 9, batch 5790
Training loss: 1.8475964069366455 

Epoch 9, batch 5791
Training loss: 1.9712715148925781 

Epoch 9, batch 5792
Training loss: 1.8249351978302002 

Epoch 9, batch 5793
Training loss: 1.5155668258666992 

Epoch 9, batch 5794
Training loss: 1.8119159936904907 

Epoch 9, batch 5795
Training loss: 1.4927754402160645 

Epoch 9, batch 5796
Training loss: 1.8904656171798706 

Epoch 9, batch 5797
Training loss: 1.5713180303573608 

Epoch 9, batch 5798
Training loss: 1.8653850555419922 

Epoch 9, batch 5799
Training loss: 1.6991586685180664 

Epoch 9, batch 5800
Training loss: 1.6822128295898

Epoch 9, batch 5986
Training loss: 1.7942860126495361 

Epoch 9, batch 5987
Training loss: 1.6420339345932007 

Epoch 9, batch 5988
Training loss: 1.642257809638977 

Epoch 9, batch 5989
Training loss: 1.6499443054199219 

Epoch 9, batch 5990
Training loss: 1.8624224662780762 

Epoch 9, batch 5991
Training loss: 1.8552372455596924 

Epoch 9, batch 5992
Training loss: 1.544620394706726 

Epoch 9, batch 5993
Training loss: 1.652527093887329 

Epoch 9, batch 5994
Training loss: 1.8099822998046875 

Epoch 9, batch 5995
Training loss: 1.5038665533065796 

Epoch 9, batch 5996
Training loss: 1.7110159397125244 

Epoch 9, batch 5997
Training loss: 1.7490615844726562 

Epoch 9, batch 5998
Training loss: 1.5554614067077637 

Epoch 9, batch 5999
Training loss: 2.0625574588775635 

Epoch 9, batch 6000
Training loss: 1.9741935729980469 

Epoch 10, batch 1
Training loss: 1.653944492340088 

Epoch 10, batch 2
Training loss: 1.7792813777923584 

Epoch 10, batch 3
Training loss: 1.9471473693847656 

Ep

Epoch 10, batch 186
Training loss: 1.7724229097366333 

Epoch 10, batch 187
Training loss: 1.6653759479522705 

Epoch 10, batch 188
Training loss: 1.7934908866882324 

Epoch 10, batch 189
Training loss: 1.8937294483184814 

Epoch 10, batch 190
Training loss: 1.8297516107559204 

Epoch 10, batch 191
Training loss: 1.9090222120285034 

Epoch 10, batch 192
Training loss: 1.5684311389923096 

Epoch 10, batch 193
Training loss: 1.6299984455108643 

Epoch 10, batch 194
Training loss: 1.777087926864624 

Epoch 10, batch 195
Training loss: 1.6531286239624023 

Epoch 10, batch 196
Training loss: 1.679518699645996 

Epoch 10, batch 197
Training loss: 1.5486781597137451 

Epoch 10, batch 198
Training loss: 1.575926661491394 

Epoch 10, batch 199
Training loss: 1.6784939765930176 

Epoch 10, batch 200
Training loss: 1.7296600341796875 

Epoch 10, batch 201
Training loss: 1.909184455871582 

Epoch 10, batch 202
Training loss: 2.0824637413024902 

Epoch 10, batch 203
Training loss: 1.764081239700317

Epoch 10, batch 389
Training loss: 1.7463406324386597 

Epoch 10, batch 390
Training loss: 1.657818078994751 

Epoch 10, batch 391
Training loss: 1.8456635475158691 

Epoch 10, batch 392
Training loss: 1.7207539081573486 

Epoch 10, batch 393
Training loss: 1.4759522676467896 

Epoch 10, batch 394
Training loss: 1.6356854438781738 

Epoch 10, batch 395
Training loss: 1.8558018207550049 

Epoch 10, batch 396
Training loss: 1.6641017198562622 

Epoch 10, batch 397
Training loss: 1.9368600845336914 

Epoch 10, batch 398
Training loss: 1.8691747188568115 

Epoch 10, batch 399
Training loss: 1.8292889595031738 

Epoch 10, batch 400
Training loss: 1.6464738845825195 

Epoch 10, batch 401
Training loss: 1.7192047834396362 

Epoch 10, batch 402
Training loss: 1.6461844444274902 

Epoch 10, batch 403
Training loss: 1.8156538009643555 

Epoch 10, batch 404
Training loss: 1.9193625450134277 

Epoch 10, batch 405
Training loss: 1.5555192232131958 

Epoch 10, batch 406
Training loss: 1.484118819236

Epoch 10, batch 591
Training loss: 1.4790153503417969 

Epoch 10, batch 592
Training loss: 1.6566758155822754 

Epoch 10, batch 593
Training loss: 1.854170799255371 

Epoch 10, batch 594
Training loss: 1.9077824354171753 

Epoch 10, batch 595
Training loss: 1.5777114629745483 

Epoch 10, batch 596
Training loss: 1.7688907384872437 

Epoch 10, batch 597
Training loss: 1.7435662746429443 

Epoch 10, batch 598
Training loss: 1.6617896556854248 

Epoch 10, batch 599
Training loss: 1.7843841314315796 

Epoch 10, batch 600
Training loss: 1.683192253112793 

Epoch 10, batch 601
Training loss: 1.9844067096710205 

Epoch 10, batch 602
Training loss: 1.5528466701507568 

Epoch 10, batch 603
Training loss: 1.8225347995758057 

Epoch 10, batch 604
Training loss: 1.6464787721633911 

Epoch 10, batch 605
Training loss: 1.5555580854415894 

Epoch 10, batch 606
Training loss: 1.7724871635437012 

Epoch 10, batch 607
Training loss: 1.7405283451080322 

Epoch 10, batch 608
Training loss: 1.6931525468826

Epoch 10, batch 794
Training loss: 1.7457518577575684 

Epoch 10, batch 795
Training loss: 1.9720619916915894 

Epoch 10, batch 796
Training loss: 1.8168761730194092 

Epoch 10, batch 797
Training loss: 1.8224807977676392 

Epoch 10, batch 798
Training loss: 1.5936030149459839 

Epoch 10, batch 799
Training loss: 1.6819612979888916 

Epoch 10, batch 800
Training loss: 1.745269536972046 

Epoch 10, batch 801
Training loss: 1.7460359334945679 

Epoch 10, batch 802
Training loss: 1.482290506362915 

Epoch 10, batch 803
Training loss: 1.5248732566833496 

Epoch 10, batch 804
Training loss: 1.6176985502243042 

Epoch 10, batch 805
Training loss: 1.9419610500335693 

Epoch 10, batch 806
Training loss: 1.8547182083129883 

Epoch 10, batch 807
Training loss: 1.6482465267181396 

Epoch 10, batch 808
Training loss: 1.9306182861328125 

Epoch 10, batch 809
Training loss: 1.7446054220199585 

Epoch 10, batch 810
Training loss: 1.7653443813323975 

Epoch 10, batch 811
Training loss: 1.9933001995086

Epoch 10, batch 997
Training loss: 1.6338872909545898 

Epoch 10, batch 998
Training loss: 2.032536506652832 

Epoch 10, batch 999
Training loss: 1.619266152381897 

Epoch 10, batch 1000
Training loss: 1.6465402841567993 

Epoch 10, batch 1001
Training loss: 1.587192177772522 

Epoch 10, batch 1002
Training loss: 1.6276814937591553 

Epoch 10, batch 1003
Training loss: 1.850640058517456 

Epoch 10, batch 1004
Training loss: 1.827958583831787 

Epoch 10, batch 1005
Training loss: 1.770833134651184 

Epoch 10, batch 1006
Training loss: 1.630173921585083 

Epoch 10, batch 1007
Training loss: 1.5406568050384521 

Epoch 10, batch 1008
Training loss: 1.5458343029022217 

Epoch 10, batch 1009
Training loss: 1.566301703453064 

Epoch 10, batch 1010
Training loss: 1.7038567066192627 

Epoch 10, batch 1011
Training loss: 1.9519354104995728 

Epoch 10, batch 1012
Training loss: 1.8997035026550293 

Epoch 10, batch 1013
Training loss: 1.5995104312896729 

Epoch 10, batch 1014
Training loss: 1.7864

Epoch 10, batch 1201
Training loss: 1.497880458831787 

Epoch 10, batch 1202
Training loss: 1.5072376728057861 

Epoch 10, batch 1203
Training loss: 1.868241310119629 

Epoch 10, batch 1204
Training loss: 1.9132013320922852 

Epoch 10, batch 1205
Training loss: 1.8462004661560059 

Epoch 10, batch 1206
Training loss: 1.757563591003418 

Epoch 10, batch 1207
Training loss: 1.7869033813476562 

Epoch 10, batch 1208
Training loss: 1.6324619054794312 

Epoch 10, batch 1209
Training loss: 1.7861595153808594 

Epoch 10, batch 1210
Training loss: 1.913738489151001 

Epoch 10, batch 1211
Training loss: 1.8186979293823242 

Epoch 10, batch 1212
Training loss: 1.919282078742981 

Epoch 10, batch 1213
Training loss: 1.5012654066085815 

Epoch 10, batch 1214
Training loss: 1.899064064025879 

Epoch 10, batch 1215
Training loss: 1.8197484016418457 

Epoch 10, batch 1216
Training loss: 1.6923900842666626 

Epoch 10, batch 1217
Training loss: 1.4820955991744995 

Epoch 10, batch 1218
Training loss: 1

Epoch 10, batch 1404
Training loss: 1.6733206510543823 

Epoch 10, batch 1405
Training loss: 1.535219669342041 

Epoch 10, batch 1406
Training loss: 1.7550891637802124 

Epoch 10, batch 1407
Training loss: 1.900984764099121 

Epoch 10, batch 1408
Training loss: 1.6754543781280518 

Epoch 10, batch 1409
Training loss: 1.8549516201019287 

Epoch 10, batch 1410
Training loss: 1.5720072984695435 

Epoch 10, batch 1411
Training loss: 1.5627424716949463 

Epoch 10, batch 1412
Training loss: 1.6778349876403809 

Epoch 10, batch 1413
Training loss: 1.6124118566513062 

Epoch 10, batch 1414
Training loss: 1.824384093284607 

Epoch 10, batch 1415
Training loss: 1.945681095123291 

Epoch 10, batch 1416
Training loss: 1.7764427661895752 

Epoch 10, batch 1417
Training loss: 1.7310240268707275 

Epoch 10, batch 1418
Training loss: 1.6602222919464111 

Epoch 10, batch 1419
Training loss: 1.7675068378448486 

Epoch 10, batch 1420
Training loss: 1.9859623908996582 

Epoch 10, batch 1421
Training loss:

Epoch 10, batch 1607
Training loss: 1.6820003986358643 

Epoch 10, batch 1608
Training loss: 1.6407036781311035 

Epoch 10, batch 1609
Training loss: 1.6081171035766602 

Epoch 10, batch 1610
Training loss: 1.657415747642517 

Epoch 10, batch 1611
Training loss: 1.6137504577636719 

Epoch 10, batch 1612
Training loss: 1.656944990158081 

Epoch 10, batch 1613
Training loss: 1.7898918390274048 

Epoch 10, batch 1614
Training loss: 1.853489875793457 

Epoch 10, batch 1615
Training loss: 1.7430721521377563 

Epoch 10, batch 1616
Training loss: 1.6605055332183838 

Epoch 10, batch 1617
Training loss: 1.7858178615570068 

Epoch 10, batch 1618
Training loss: 1.5863828659057617 

Epoch 10, batch 1619
Training loss: 1.7630083560943604 

Epoch 10, batch 1620
Training loss: 1.7268704175949097 

Epoch 10, batch 1621
Training loss: 1.6974501609802246 

Epoch 10, batch 1622
Training loss: 1.8723268508911133 

Epoch 10, batch 1623
Training loss: 1.6242246627807617 

Epoch 10, batch 1624
Training loss

Epoch 10, batch 1808
Training loss: 1.6854151487350464 

Epoch 10, batch 1809
Training loss: 1.650123953819275 

Epoch 10, batch 1810
Training loss: 1.9068598747253418 

Epoch 10, batch 1811
Training loss: 1.5071744918823242 

Epoch 10, batch 1812
Training loss: 1.8627374172210693 

Epoch 10, batch 1813
Training loss: 1.5202865600585938 

Epoch 10, batch 1814
Training loss: 1.7287185192108154 

Epoch 10, batch 1815
Training loss: 1.480800747871399 

Epoch 10, batch 1816
Training loss: 1.7726949453353882 

Epoch 10, batch 1817
Training loss: 1.6622099876403809 

Epoch 10, batch 1818
Training loss: 1.7493270635604858 

Epoch 10, batch 1819
Training loss: 1.8588225841522217 

Epoch 10, batch 1820
Training loss: 1.536859393119812 

Epoch 10, batch 1821
Training loss: 1.8823820352554321 

Epoch 10, batch 1822
Training loss: 1.8198882341384888 

Epoch 10, batch 1823
Training loss: 1.5111958980560303 

Epoch 10, batch 1824
Training loss: 2.046515464782715 

Epoch 10, batch 1825
Training loss:

Epoch 10, batch 2010
Training loss: 1.670831322669983 

Epoch 10, batch 2011
Training loss: 1.9544410705566406 

Epoch 10, batch 2012
Training loss: 1.815413475036621 

Epoch 10, batch 2013
Training loss: 1.7706459760665894 

Epoch 10, batch 2014
Training loss: 1.9013631343841553 

Epoch 10, batch 2015
Training loss: 1.7014353275299072 

Epoch 10, batch 2016
Training loss: 1.9214754104614258 

Epoch 10, batch 2017
Training loss: 1.6628577709197998 

Epoch 10, batch 2018
Training loss: 1.546600341796875 

Epoch 10, batch 2019
Training loss: 1.7769699096679688 

Epoch 10, batch 2020
Training loss: 1.7800471782684326 

Epoch 10, batch 2021
Training loss: 1.4854042530059814 

Epoch 10, batch 2022
Training loss: 1.8201305866241455 

Epoch 10, batch 2023
Training loss: 1.8741023540496826 

Epoch 10, batch 2024
Training loss: 1.797638177871704 

Epoch 10, batch 2025
Training loss: 1.887608528137207 

Epoch 10, batch 2026
Training loss: 1.7896403074264526 

Epoch 10, batch 2027
Training loss: 

Epoch 10, batch 2213
Training loss: 1.7298367023468018 

Epoch 10, batch 2214
Training loss: 1.5756152868270874 

Epoch 10, batch 2215
Training loss: 1.6342120170593262 

Epoch 10, batch 2216
Training loss: 1.6077791452407837 

Epoch 10, batch 2217
Training loss: 1.8945186138153076 

Epoch 10, batch 2218
Training loss: 1.9624332189559937 

Epoch 10, batch 2219
Training loss: 1.8741739988327026 

Epoch 10, batch 2220
Training loss: 1.9571572542190552 

Epoch 10, batch 2221
Training loss: 1.6548335552215576 

Epoch 10, batch 2222
Training loss: 1.5504100322723389 

Epoch 10, batch 2223
Training loss: 1.701995611190796 

Epoch 10, batch 2224
Training loss: 1.9761751890182495 

Epoch 10, batch 2225
Training loss: 1.8987846374511719 

Epoch 10, batch 2226
Training loss: 1.692396879196167 

Epoch 10, batch 2227
Training loss: 2.016042709350586 

Epoch 10, batch 2228
Training loss: 1.6759328842163086 

Epoch 10, batch 2229
Training loss: 1.6917519569396973 

Epoch 10, batch 2230
Training loss

Epoch 10, batch 2415
Training loss: 1.7226788997650146 

Epoch 10, batch 2416
Training loss: 1.5942283868789673 

Epoch 10, batch 2417
Training loss: 1.851068139076233 

Epoch 10, batch 2418
Training loss: 1.7021318674087524 

Epoch 10, batch 2419
Training loss: 1.6318451166152954 

Epoch 10, batch 2420
Training loss: 1.9664413928985596 

Epoch 10, batch 2421
Training loss: 1.5654603242874146 

Epoch 10, batch 2422
Training loss: 1.7373665571212769 

Epoch 10, batch 2423
Training loss: 1.7326486110687256 

Epoch 10, batch 2424
Training loss: 1.6497758626937866 

Epoch 10, batch 2425
Training loss: 1.6326878070831299 

Epoch 10, batch 2426
Training loss: 1.523790955543518 

Epoch 10, batch 2427
Training loss: 1.7221590280532837 

Epoch 10, batch 2428
Training loss: 1.6480519771575928 

Epoch 10, batch 2429
Training loss: 1.8353179693222046 

Epoch 10, batch 2430
Training loss: 1.8818398714065552 

Epoch 10, batch 2431
Training loss: 1.5942225456237793 

Epoch 10, batch 2432
Training los

Epoch 10, batch 2617
Training loss: 1.7068086862564087 

Epoch 10, batch 2618
Training loss: 1.7377499341964722 

Epoch 10, batch 2619
Training loss: 1.5377177000045776 

Epoch 10, batch 2620
Training loss: 1.920462727546692 

Epoch 10, batch 2621
Training loss: 1.6130174398422241 

Epoch 10, batch 2622
Training loss: 1.9158543348312378 

Epoch 10, batch 2623
Training loss: 1.5771013498306274 

Epoch 10, batch 2624
Training loss: 1.6236627101898193 

Epoch 10, batch 2625
Training loss: 1.699408769607544 

Epoch 10, batch 2626
Training loss: 1.7698144912719727 

Epoch 10, batch 2627
Training loss: 1.855581283569336 

Epoch 10, batch 2628
Training loss: 1.5620214939117432 

Epoch 10, batch 2629
Training loss: 1.5353273153305054 

Epoch 10, batch 2630
Training loss: 1.6043366193771362 

Epoch 10, batch 2631
Training loss: 1.7370729446411133 

Epoch 10, batch 2632
Training loss: 1.8158162832260132 

Epoch 10, batch 2633
Training loss: 1.5351080894470215 

Epoch 10, batch 2634
Training loss

Epoch 10, batch 2818
Training loss: 1.7449133396148682 

Epoch 10, batch 2819
Training loss: 1.8741743564605713 

Epoch 10, batch 2820
Training loss: 1.9845821857452393 

Epoch 10, batch 2821
Training loss: 1.6199240684509277 

Epoch 10, batch 2822
Training loss: 1.8130698204040527 

Epoch 10, batch 2823
Training loss: 1.8443870544433594 

Epoch 10, batch 2824
Training loss: 1.7671983242034912 

Epoch 10, batch 2825
Training loss: 1.6063928604125977 

Epoch 10, batch 2826
Training loss: 1.9179476499557495 

Epoch 10, batch 2827
Training loss: 1.8724730014801025 

Epoch 10, batch 2828
Training loss: 1.8167887926101685 

Epoch 10, batch 2829
Training loss: 1.753084659576416 

Epoch 10, batch 2830
Training loss: 1.8406227827072144 

Epoch 10, batch 2831
Training loss: 1.6071480512619019 

Epoch 10, batch 2832
Training loss: 1.746005892753601 

Epoch 10, batch 2833
Training loss: 1.8461809158325195 

Epoch 10, batch 2834
Training loss: 1.9262733459472656 

Epoch 10, batch 2835
Training los

Epoch 10, batch 3021
Training loss: 1.9548532962799072 

Epoch 10, batch 3022
Training loss: 1.802520513534546 

Epoch 10, batch 3023
Training loss: 1.6430683135986328 

Epoch 10, batch 3024
Training loss: 1.5661604404449463 

Epoch 10, batch 3025
Training loss: 1.64285147190094 

Epoch 10, batch 3026
Training loss: 1.9007811546325684 

Epoch 10, batch 3027
Training loss: 1.887745976448059 

Epoch 10, batch 3028
Training loss: 1.7596486806869507 

Epoch 10, batch 3029
Training loss: 1.5736637115478516 

Epoch 10, batch 3030
Training loss: 1.994645118713379 

Epoch 10, batch 3031
Training loss: 1.8508212566375732 

Epoch 10, batch 3032
Training loss: 1.800091028213501 

Epoch 10, batch 3033
Training loss: 1.8133243322372437 

Epoch 10, batch 3034
Training loss: 1.7691237926483154 

Epoch 10, batch 3035
Training loss: 1.8697500228881836 

Epoch 10, batch 3036
Training loss: 1.816847562789917 

Epoch 10, batch 3037
Training loss: 1.4677814245224 

Epoch 10, batch 3038
Training loss: 1.648

Epoch 10, batch 3226
Training loss: 1.5923889875411987 

Epoch 10, batch 3227
Training loss: 1.6808202266693115 

Epoch 10, batch 3228
Training loss: 1.848304271697998 

Epoch 10, batch 3229
Training loss: 1.7816202640533447 

Epoch 10, batch 3230
Training loss: 1.5527325868606567 

Epoch 10, batch 3231
Training loss: 1.7845032215118408 

Epoch 10, batch 3232
Training loss: 1.8179240226745605 

Epoch 10, batch 3233
Training loss: 1.8608989715576172 

Epoch 10, batch 3234
Training loss: 1.7612345218658447 

Epoch 10, batch 3235
Training loss: 1.535221815109253 

Epoch 10, batch 3236
Training loss: 1.6707631349563599 

Epoch 10, batch 3237
Training loss: 1.623258113861084 

Epoch 10, batch 3238
Training loss: 1.6666975021362305 

Epoch 10, batch 3239
Training loss: 1.787627935409546 

Epoch 10, batch 3240
Training loss: 1.6804351806640625 

Epoch 10, batch 3241
Training loss: 1.8526579141616821 

Epoch 10, batch 3242
Training loss: 1.8152248859405518 

Epoch 10, batch 3243
Training loss:

Epoch 10, batch 3428
Training loss: 1.5577036142349243 

Epoch 10, batch 3429
Training loss: 1.669311761856079 

Epoch 10, batch 3430
Training loss: 1.6918396949768066 

Epoch 10, batch 3431
Training loss: 1.7489092350006104 

Epoch 10, batch 3432
Training loss: 1.8843772411346436 

Epoch 10, batch 3433
Training loss: 1.8767304420471191 

Epoch 10, batch 3434
Training loss: 1.7752351760864258 

Epoch 10, batch 3435
Training loss: 1.8559925556182861 

Epoch 10, batch 3436
Training loss: 1.657150149345398 

Epoch 10, batch 3437
Training loss: 1.912580966949463 

Epoch 10, batch 3438
Training loss: 1.9146215915679932 

Epoch 10, batch 3439
Training loss: 1.8467793464660645 

Epoch 10, batch 3440
Training loss: 1.6474636793136597 

Epoch 10, batch 3441
Training loss: 1.8623902797698975 

Epoch 10, batch 3442
Training loss: 1.8300702571868896 

Epoch 10, batch 3443
Training loss: 1.655908226966858 

Epoch 10, batch 3444
Training loss: 1.7096149921417236 

Epoch 10, batch 3445
Training loss:

Epoch 10, batch 3632
Training loss: 1.7845919132232666 

Epoch 10, batch 3633
Training loss: 1.6476101875305176 

Epoch 10, batch 3634
Training loss: 1.905539870262146 

Epoch 10, batch 3635
Training loss: 1.9613341093063354 

Epoch 10, batch 3636
Training loss: 1.7216120958328247 

Epoch 10, batch 3637
Training loss: 1.898789405822754 

Epoch 10, batch 3638
Training loss: 1.7734456062316895 

Epoch 10, batch 3639
Training loss: 1.5984196662902832 

Epoch 10, batch 3640
Training loss: 1.911039113998413 

Epoch 10, batch 3641
Training loss: 1.7093744277954102 

Epoch 10, batch 3642
Training loss: 1.9275448322296143 

Epoch 10, batch 3643
Training loss: 1.7968437671661377 

Epoch 10, batch 3644
Training loss: 1.7815158367156982 

Epoch 10, batch 3645
Training loss: 1.573897361755371 

Epoch 10, batch 3646
Training loss: 1.9050624370574951 

Epoch 10, batch 3647
Training loss: 1.6119695901870728 

Epoch 10, batch 3648
Training loss: 1.60270357131958 

Epoch 10, batch 3649
Training loss: 1

Epoch 10, batch 3828
Training loss: 1.5155763626098633 

Epoch 10, batch 3829
Training loss: 1.5831208229064941 

Epoch 10, batch 3830
Training loss: 1.5949970483779907 

Epoch 10, batch 3831
Training loss: 1.7898974418640137 

Epoch 10, batch 3832
Training loss: 1.4765772819519043 

Epoch 10, batch 3833
Training loss: 1.7824857234954834 

Epoch 10, batch 3834
Training loss: 1.7216912508010864 

Epoch 10, batch 3835
Training loss: 1.9802470207214355 

Epoch 10, batch 3836
Training loss: 1.6892805099487305 

Epoch 10, batch 3837
Training loss: 1.5298877954483032 

Epoch 10, batch 3838
Training loss: 1.5412923097610474 

Epoch 10, batch 3839
Training loss: 1.7649394273757935 

Epoch 10, batch 3840
Training loss: 1.8556042909622192 

Epoch 10, batch 3841
Training loss: 1.8948496580123901 

Epoch 10, batch 3842
Training loss: 1.8688242435455322 

Epoch 10, batch 3843
Training loss: 1.8683912754058838 

Epoch 10, batch 3844
Training loss: 1.6504855155944824 

Epoch 10, batch 3845
Training l

Epoch 10, batch 4030
Training loss: 2.015627861022949 

Epoch 10, batch 4031
Training loss: 1.9765217304229736 

Epoch 10, batch 4032
Training loss: 1.7404417991638184 

Epoch 10, batch 4033
Training loss: 1.7338213920593262 

Epoch 10, batch 4034
Training loss: 1.4718728065490723 

Epoch 10, batch 4035
Training loss: 1.7455167770385742 

Epoch 10, batch 4036
Training loss: 1.5999375581741333 

Epoch 10, batch 4037
Training loss: 1.6412155628204346 

Epoch 10, batch 4038
Training loss: 2.0441741943359375 

Epoch 10, batch 4039
Training loss: 1.6750011444091797 

Epoch 10, batch 4040
Training loss: 1.5641913414001465 

Epoch 10, batch 4041
Training loss: 1.8087971210479736 

Epoch 10, batch 4042
Training loss: 1.8919153213500977 

Epoch 10, batch 4043
Training loss: 1.7144138813018799 

Epoch 10, batch 4044
Training loss: 1.7945644855499268 

Epoch 10, batch 4045
Training loss: 1.716566801071167 

Epoch 10, batch 4046
Training loss: 1.6575312614440918 

Epoch 10, batch 4047
Training los

Epoch 10, batch 4234
Training loss: 1.7304755449295044 

Epoch 10, batch 4235
Training loss: 1.887373924255371 

Epoch 10, batch 4236
Training loss: 1.5750982761383057 

Epoch 10, batch 4237
Training loss: 1.796529769897461 

Epoch 10, batch 4238
Training loss: 1.7456656694412231 

Epoch 10, batch 4239
Training loss: 1.555719017982483 

Epoch 10, batch 4240
Training loss: 1.8195807933807373 

Epoch 10, batch 4241
Training loss: 1.745471477508545 

Epoch 10, batch 4242
Training loss: 1.7352474927902222 

Epoch 10, batch 4243
Training loss: 1.856215238571167 

Epoch 10, batch 4244
Training loss: 1.7695996761322021 

Epoch 10, batch 4245
Training loss: 1.5917235612869263 

Epoch 10, batch 4246
Training loss: 1.5582168102264404 

Epoch 10, batch 4247
Training loss: 1.4872270822525024 

Epoch 10, batch 4248
Training loss: 1.8479440212249756 

Epoch 10, batch 4249
Training loss: 1.524787187576294 

Epoch 10, batch 4250
Training loss: 1.6681220531463623 

Epoch 10, batch 4251
Training loss: 1

Epoch 10, batch 4437
Training loss: 1.4751454591751099 

Epoch 10, batch 4438
Training loss: 1.7209572792053223 

Epoch 10, batch 4439
Training loss: 1.513837218284607 

Epoch 10, batch 4440
Training loss: 2.0698070526123047 

Epoch 10, batch 4441
Training loss: 1.6450481414794922 

Epoch 10, batch 4442
Training loss: 1.8300142288208008 

Epoch 10, batch 4443
Training loss: 1.7106199264526367 

Epoch 10, batch 4444
Training loss: 1.8329081535339355 

Epoch 10, batch 4445
Training loss: 1.881598949432373 

Epoch 10, batch 4446
Training loss: 1.6615123748779297 

Epoch 10, batch 4447
Training loss: 1.7911148071289062 

Epoch 10, batch 4448
Training loss: 1.771773099899292 

Epoch 10, batch 4449
Training loss: 1.8240702152252197 

Epoch 10, batch 4450
Training loss: 1.7536036968231201 

Epoch 10, batch 4451
Training loss: 1.6301004886627197 

Epoch 10, batch 4452
Training loss: 1.696601152420044 

Epoch 10, batch 4453
Training loss: 1.6733640432357788 

Epoch 10, batch 4454
Training loss:

Epoch 10, batch 4639
Training loss: 1.9631563425064087 

Epoch 10, batch 4640
Training loss: 1.7594389915466309 

Epoch 10, batch 4641
Training loss: 1.4874536991119385 

Epoch 10, batch 4642
Training loss: 1.7107326984405518 

Epoch 10, batch 4643
Training loss: 1.6819112300872803 

Epoch 10, batch 4644
Training loss: 1.6445622444152832 

Epoch 10, batch 4645
Training loss: 1.4844313859939575 

Epoch 10, batch 4646
Training loss: 1.7160747051239014 

Epoch 10, batch 4647
Training loss: 1.5503597259521484 

Epoch 10, batch 4648
Training loss: 1.6232069730758667 

Epoch 10, batch 4649
Training loss: 1.8561913967132568 

Epoch 10, batch 4650
Training loss: 1.547473430633545 

Epoch 10, batch 4651
Training loss: 1.7432844638824463 

Epoch 10, batch 4652
Training loss: 1.6590789556503296 

Epoch 10, batch 4653
Training loss: 1.9467275142669678 

Epoch 10, batch 4654
Training loss: 1.6767683029174805 

Epoch 10, batch 4655
Training loss: 1.7681317329406738 

Epoch 10, batch 4656
Training lo

Epoch 10, batch 4840
Training loss: 1.6325603723526 

Epoch 10, batch 4841
Training loss: 1.7011561393737793 

Epoch 10, batch 4842
Training loss: 1.520756483078003 

Epoch 10, batch 4843
Training loss: 1.7278861999511719 

Epoch 10, batch 4844
Training loss: 1.7132718563079834 

Epoch 10, batch 4845
Training loss: 1.9428625106811523 

Epoch 10, batch 4846
Training loss: 1.5939042568206787 

Epoch 10, batch 4847
Training loss: 1.7910499572753906 

Epoch 10, batch 4848
Training loss: 1.6036123037338257 

Epoch 10, batch 4849
Training loss: 1.5822272300720215 

Epoch 10, batch 4850
Training loss: 1.6244237422943115 

Epoch 10, batch 4851
Training loss: 1.7128140926361084 

Epoch 10, batch 4852
Training loss: 1.907632827758789 

Epoch 10, batch 4853
Training loss: 1.7860257625579834 

Epoch 10, batch 4854
Training loss: 1.6029515266418457 

Epoch 10, batch 4855
Training loss: 1.5101754665374756 

Epoch 10, batch 4856
Training loss: 1.839716911315918 

Epoch 10, batch 4857
Training loss: 1

Epoch 10, batch 5041
Training loss: 1.8058342933654785 

Epoch 10, batch 5042
Training loss: 1.8491568565368652 

Epoch 10, batch 5043
Training loss: 1.694685697555542 

Epoch 10, batch 5044
Training loss: 1.7385376691818237 

Epoch 10, batch 5045
Training loss: 1.6387219429016113 

Epoch 10, batch 5046
Training loss: 1.8488705158233643 

Epoch 10, batch 5047
Training loss: 1.739903211593628 

Epoch 10, batch 5048
Training loss: 1.8064051866531372 

Epoch 10, batch 5049
Training loss: 1.8755762577056885 

Epoch 10, batch 5050
Training loss: 1.6200875043869019 

Epoch 10, batch 5051
Training loss: 1.7891634702682495 

Epoch 10, batch 5052
Training loss: 1.7598788738250732 

Epoch 10, batch 5053
Training loss: 1.6115245819091797 

Epoch 10, batch 5054
Training loss: 1.7338019609451294 

Epoch 10, batch 5055
Training loss: 1.6170358657836914 

Epoch 10, batch 5056
Training loss: 1.5230798721313477 

Epoch 10, batch 5057
Training loss: 1.6449040174484253 

Epoch 10, batch 5058
Training los

Epoch 10, batch 5243
Training loss: 1.701870322227478 

Epoch 10, batch 5244
Training loss: 1.7050089836120605 

Epoch 10, batch 5245
Training loss: 1.7632511854171753 

Epoch 10, batch 5246
Training loss: 1.8067760467529297 

Epoch 10, batch 5247
Training loss: 1.9611191749572754 

Epoch 10, batch 5248
Training loss: 1.9116946458816528 

Epoch 10, batch 5249
Training loss: 1.5878371000289917 

Epoch 10, batch 5250
Training loss: 1.6540076732635498 

Epoch 10, batch 5251
Training loss: 1.606649398803711 

Epoch 10, batch 5252
Training loss: 1.73924720287323 

Epoch 10, batch 5253
Training loss: 1.9280662536621094 

Epoch 10, batch 5254
Training loss: 1.6376374959945679 

Epoch 10, batch 5255
Training loss: 1.7461307048797607 

Epoch 10, batch 5256
Training loss: 1.5208624601364136 

Epoch 10, batch 5257
Training loss: 1.7799564599990845 

Epoch 10, batch 5258
Training loss: 1.6603562831878662 

Epoch 10, batch 5259
Training loss: 1.9115300178527832 

Epoch 10, batch 5260
Training loss:

Epoch 10, batch 5446
Training loss: 1.9548205137252808 

Epoch 10, batch 5447
Training loss: 1.9431369304656982 

Epoch 10, batch 5448
Training loss: 1.723223328590393 

Epoch 10, batch 5449
Training loss: 1.9694867134094238 

Epoch 10, batch 5450
Training loss: 1.8081271648406982 

Epoch 10, batch 5451
Training loss: 1.6476277112960815 

Epoch 10, batch 5452
Training loss: 1.8232083320617676 

Epoch 10, batch 5453
Training loss: 1.7936757802963257 

Epoch 10, batch 5454
Training loss: 1.972135305404663 

Epoch 10, batch 5455
Training loss: 1.61649489402771 

Epoch 10, batch 5456
Training loss: 1.6451491117477417 

Epoch 10, batch 5457
Training loss: 1.7363840341567993 

Epoch 10, batch 5458
Training loss: 1.5501190423965454 

Epoch 10, batch 5459
Training loss: 1.8736331462860107 

Epoch 10, batch 5460
Training loss: 1.5204285383224487 

Epoch 10, batch 5461
Training loss: 1.7191134691238403 

Epoch 10, batch 5462
Training loss: 1.5958092212677002 

Epoch 10, batch 5463
Training loss:

Epoch 10, batch 5642
Training loss: 1.5472244024276733 

Epoch 10, batch 5643
Training loss: 1.6328277587890625 

Epoch 10, batch 5644
Training loss: 1.8932561874389648 

Epoch 10, batch 5645
Training loss: 1.74770188331604 

Epoch 10, batch 5646
Training loss: 1.7620726823806763 

Epoch 10, batch 5647
Training loss: 1.9558234214782715 

Epoch 10, batch 5648
Training loss: 1.5689176321029663 

Epoch 10, batch 5649
Training loss: 1.6503140926361084 

Epoch 10, batch 5650
Training loss: 1.6873235702514648 

Epoch 10, batch 5651
Training loss: 1.5027719736099243 

Epoch 10, batch 5652
Training loss: 1.6370481252670288 

Epoch 10, batch 5653
Training loss: 1.6013730764389038 

Epoch 10, batch 5654
Training loss: 1.683150053024292 

Epoch 10, batch 5655
Training loss: 1.9129478931427002 

Epoch 10, batch 5656
Training loss: 1.7470057010650635 

Epoch 10, batch 5657
Training loss: 1.5519263744354248 

Epoch 10, batch 5658
Training loss: 1.8713717460632324 

Epoch 10, batch 5659
Training loss

Epoch 10, batch 5845
Training loss: 1.51950204372406 

Epoch 10, batch 5846
Training loss: 1.8845237493515015 

Epoch 10, batch 5847
Training loss: 1.8247469663619995 

Epoch 10, batch 5848
Training loss: 1.5244932174682617 

Epoch 10, batch 5849
Training loss: 1.664185881614685 

Epoch 10, batch 5850
Training loss: 1.6264889240264893 

Epoch 10, batch 5851
Training loss: 1.924539566040039 

Epoch 10, batch 5852
Training loss: 1.5878324508666992 

Epoch 10, batch 5853
Training loss: 1.6142404079437256 

Epoch 10, batch 5854
Training loss: 1.6420928239822388 

Epoch 10, batch 5855
Training loss: 1.796539545059204 

Epoch 10, batch 5856
Training loss: 1.4932479858398438 

Epoch 10, batch 5857
Training loss: 1.684606909751892 

Epoch 10, batch 5858
Training loss: 1.6333355903625488 

Epoch 10, batch 5859
Training loss: 1.9395098686218262 

Epoch 10, batch 5860
Training loss: 1.6793819665908813 

Epoch 10, batch 5861
Training loss: 1.9561569690704346 

Epoch 10, batch 5862
Training loss: 1

### Evaluate

In [9]:
def eval_model(model, test_data):
    test_loader = DataLoader(test_data, batch_size=10, shuffle=True)
#     print(f'test_loader = {test_loader}')
    correct = 0
    total = 0
    with torch.no_grad():
        for data in test_loader:
            x, y = data
#             print(f'x.shape = {x.shape}')
#             print(f'y.shape = {y}')
            output = model(x.view(-1, 784))
#             print(f'output = {output}')
            for idx, i in enumerate(output):
                if torch.argmax(i) == y[idx]:
                    correct += 1
                total += 1
    print(f'accuracy: {correct/total}')

eval_model(model, mnist_test)

  x = F.softmax(x)


accuracy: 0.931
