## Multiclass Classification Model on MNIST Dataset

### Dependencies Imports

In [38]:
import torch
import torch.nn as nn
import torch.nn.functional as F

import torch.optim as optim
from torch.utils.data import TensorDataset, DataLoader

import torchvision
import torchvision.datasets as datasets
import torchvision.transforms as transforms
from PIL import Image

import numpy as np
import random

### Data Preparation

In [39]:
transform = transforms.Compose([
    transforms.ToTensor(),
    transforms.Normalize((0.5,), (0.5,)),
])

In [40]:
mnist_train = datasets.MNIST(root='./data', train=True, download=False, transform=transform)
mnist_test = datasets.MNIST(root='./data', train=False, download=False, transform=transform)

### Model

In [41]:
class MNIST_Model(nn.Module):
    def __init__(self):
        super(MNIST_Model, self).__init__()
        self.hidden1 = nn.Linear(28*28, 50)
        self.output = nn.Linear(50, 10)
    def forward(self, x):
        x = self.hidden1(x)
        x = F.sigmoid(x)
        x = self.output(x)
        x = F.log_softmax(x, dim=1)
        return x

### Training

In [46]:
# training
def train_model(model, train_data):
    train_loader = DataLoader(train_data, batch_size=10, shuffle=True)
    
    loss_fn = nn.CrossEntropyLoss()
    optimizer = optim.Adam(model.parameters(), lr=0.001) #e-1
    epoch = 10

    for epoch in range(epoch):
        model.train()
        batch = 0
        for data in train_loader:
            batch += 1
            x, y = data
            optimizer.zero_grad()
            output = model(x.view(-1, 28*28))
            loss = loss_fn(output, y)
            print(f'Epoch {epoch + 1}, batch {batch}')
            print(f'training loss: {loss} \n')
            loss.backward()
            optimizer.step()
        
model = MNIST_Model()
train_model(model, mnist_train)

Epoch 1, batch 1
training loss: 2.327225685119629 

Epoch 1, batch 2
training loss: 2.2547380924224854 

Epoch 1, batch 3
training loss: 2.38495135307312 

Epoch 1, batch 4
training loss: 2.298846960067749 

Epoch 1, batch 5
training loss: 2.251718044281006 

Epoch 1, batch 6
training loss: 2.6407933235168457 

Epoch 1, batch 7
training loss: 2.4106225967407227 

Epoch 1, batch 8
training loss: 2.530484437942505 

Epoch 1, batch 9
training loss: 2.163801670074463 

Epoch 1, batch 10
training loss: 2.1432976722717285 

Epoch 1, batch 11
training loss: 2.346522808074951 

Epoch 1, batch 12
training loss: 2.232602119445801 

Epoch 1, batch 13
training loss: 2.313727617263794 

Epoch 1, batch 14
training loss: 2.1225128173828125 

Epoch 1, batch 15
training loss: 2.122763156890869 

Epoch 1, batch 16
training loss: 2.217761993408203 

Epoch 1, batch 17
training loss: 2.2493398189544678 

Epoch 1, batch 18
training loss: 2.275660991668701 

Epoch 1, batch 19
training loss: 2.253000497817993

Epoch 1, batch 190
training loss: 1.271484136581421 

Epoch 1, batch 191
training loss: 1.2284350395202637 

Epoch 1, batch 192
training loss: 1.2900711297988892 

Epoch 1, batch 193
training loss: 1.1364723443984985 

Epoch 1, batch 194
training loss: 1.2682725191116333 

Epoch 1, batch 195
training loss: 1.0686004161834717 

Epoch 1, batch 196
training loss: 0.9532972574234009 

Epoch 1, batch 197
training loss: 1.008105993270874 

Epoch 1, batch 198
training loss: 1.1306359767913818 

Epoch 1, batch 199
training loss: 1.1088449954986572 

Epoch 1, batch 200
training loss: 1.3080081939697266 

Epoch 1, batch 201
training loss: 1.123275876045227 

Epoch 1, batch 202
training loss: 1.2853528261184692 

Epoch 1, batch 203
training loss: 1.5264593362808228 

Epoch 1, batch 204
training loss: 1.6649501323699951 

Epoch 1, batch 205
training loss: 1.3469288349151611 

Epoch 1, batch 206
training loss: 1.1497365236282349 

Epoch 1, batch 207
training loss: 1.0511069297790527 

Epoch 1, batc

Epoch 1, batch 408
training loss: 0.7469614744186401 

Epoch 1, batch 409
training loss: 0.9806791543960571 

Epoch 1, batch 410
training loss: 1.0292868614196777 

Epoch 1, batch 411
training loss: 0.6609417200088501 

Epoch 1, batch 412
training loss: 0.528598427772522 

Epoch 1, batch 413
training loss: 0.6343280673027039 

Epoch 1, batch 414
training loss: 0.7248181700706482 

Epoch 1, batch 415
training loss: 0.8468929529190063 

Epoch 1, batch 416
training loss: 0.5947611927986145 

Epoch 1, batch 417
training loss: 0.8170591592788696 

Epoch 1, batch 418
training loss: 0.7637423276901245 

Epoch 1, batch 419
training loss: 0.639510989189148 

Epoch 1, batch 420
training loss: 1.0115278959274292 

Epoch 1, batch 421
training loss: 0.4897603988647461 

Epoch 1, batch 422
training loss: 0.9218262434005737 

Epoch 1, batch 423
training loss: 0.5941669344902039 

Epoch 1, batch 424
training loss: 0.5120471119880676 

Epoch 1, batch 425
training loss: 0.7172623872756958 

Epoch 1, bat

Epoch 1, batch 627
training loss: 0.7421920895576477 

Epoch 1, batch 628
training loss: 0.8225499391555786 

Epoch 1, batch 629
training loss: 0.490936279296875 

Epoch 1, batch 630
training loss: 0.6505508422851562 

Epoch 1, batch 631
training loss: 0.4423099458217621 

Epoch 1, batch 632
training loss: 0.756377100944519 

Epoch 1, batch 633
training loss: 0.8458075523376465 

Epoch 1, batch 634
training loss: 0.5501059293746948 

Epoch 1, batch 635
training loss: 0.47149863839149475 

Epoch 1, batch 636
training loss: 0.5548356771469116 

Epoch 1, batch 637
training loss: 0.3515075445175171 

Epoch 1, batch 638
training loss: 0.43243542313575745 

Epoch 1, batch 639
training loss: 0.47209709882736206 

Epoch 1, batch 640
training loss: 0.5318939089775085 

Epoch 1, batch 641
training loss: 0.49150675535202026 

Epoch 1, batch 642
training loss: 0.44224658608436584 

Epoch 1, batch 643
training loss: 0.41861653327941895 

Epoch 1, batch 644
training loss: 1.1612012386322021 

Epoch 

Epoch 1, batch 847
training loss: 0.7183061838150024 

Epoch 1, batch 848
training loss: 0.4726925492286682 

Epoch 1, batch 849
training loss: 0.41459912061691284 

Epoch 1, batch 850
training loss: 0.2441742867231369 

Epoch 1, batch 851
training loss: 0.2451665848493576 

Epoch 1, batch 852
training loss: 0.5252528190612793 

Epoch 1, batch 853
training loss: 0.1722320318222046 

Epoch 1, batch 854
training loss: 0.7155513763427734 

Epoch 1, batch 855
training loss: 0.4997130334377289 

Epoch 1, batch 856
training loss: 0.39391282200813293 

Epoch 1, batch 857
training loss: 0.22313587367534637 

Epoch 1, batch 858
training loss: 0.19357851147651672 

Epoch 1, batch 859
training loss: 1.1549547910690308 

Epoch 1, batch 860
training loss: 0.31164199113845825 

Epoch 1, batch 861
training loss: 0.571043848991394 

Epoch 1, batch 862
training loss: 0.8058068156242371 

Epoch 1, batch 863
training loss: 0.6844323873519897 

Epoch 1, batch 864
training loss: 0.49712076783180237 

Epoch

Epoch 1, batch 1066
training loss: 0.18382106721401215 

Epoch 1, batch 1067
training loss: 0.7574867010116577 

Epoch 1, batch 1068
training loss: 0.6100079417228699 

Epoch 1, batch 1069
training loss: 0.2368718683719635 

Epoch 1, batch 1070
training loss: 0.1699695885181427 

Epoch 1, batch 1071
training loss: 0.5163748860359192 

Epoch 1, batch 1072
training loss: 0.4037557542324066 

Epoch 1, batch 1073
training loss: 0.27690961956977844 

Epoch 1, batch 1074
training loss: 0.4418541491031647 

Epoch 1, batch 1075
training loss: 0.3296670913696289 

Epoch 1, batch 1076
training loss: 0.1321330964565277 

Epoch 1, batch 1077
training loss: 0.2912033498287201 

Epoch 1, batch 1078
training loss: 0.7138214111328125 

Epoch 1, batch 1079
training loss: 0.49269723892211914 

Epoch 1, batch 1080
training loss: 0.521862804889679 

Epoch 1, batch 1081
training loss: 0.11873097717761993 

Epoch 1, batch 1082
training loss: 0.30725282430648804 

Epoch 1, batch 1083
training loss: 0.2457066

Epoch 1, batch 1256
training loss: 0.24583539366722107 

Epoch 1, batch 1257
training loss: 1.1093024015426636 

Epoch 1, batch 1258
training loss: 0.3559468686580658 

Epoch 1, batch 1259
training loss: 0.6926121711730957 

Epoch 1, batch 1260
training loss: 0.25724515318870544 

Epoch 1, batch 1261
training loss: 0.21514566242694855 

Epoch 1, batch 1262
training loss: 0.4070318341255188 

Epoch 1, batch 1263
training loss: 0.388510525226593 

Epoch 1, batch 1264
training loss: 0.35063332319259644 

Epoch 1, batch 1265
training loss: 0.5561740398406982 

Epoch 1, batch 1266
training loss: 0.26011863350868225 

Epoch 1, batch 1267
training loss: 0.4868711531162262 

Epoch 1, batch 1268
training loss: 0.4108216166496277 

Epoch 1, batch 1269
training loss: 0.6714478731155396 

Epoch 1, batch 1270
training loss: 0.3955414891242981 

Epoch 1, batch 1271
training loss: 0.1892106682062149 

Epoch 1, batch 1272
training loss: 0.4114454388618469 

Epoch 1, batch 1273
training loss: 0.1862336

Epoch 1, batch 1461
training loss: 0.4567747116088867 

Epoch 1, batch 1462
training loss: 0.34541720151901245 

Epoch 1, batch 1463
training loss: 0.33445626497268677 

Epoch 1, batch 1464
training loss: 0.3755183815956116 

Epoch 1, batch 1465
training loss: 0.3931161165237427 

Epoch 1, batch 1466
training loss: 0.09153866022825241 

Epoch 1, batch 1467
training loss: 0.2547302842140198 

Epoch 1, batch 1468
training loss: 0.13567452132701874 

Epoch 1, batch 1469
training loss: 0.22421889007091522 

Epoch 1, batch 1470
training loss: 0.32625630497932434 

Epoch 1, batch 1471
training loss: 0.3309374749660492 

Epoch 1, batch 1472
training loss: 0.8150313496589661 

Epoch 1, batch 1473
training loss: 0.3628203272819519 

Epoch 1, batch 1474
training loss: 0.27710673213005066 

Epoch 1, batch 1475
training loss: 1.4399279356002808 

Epoch 1, batch 1476
training loss: 0.40039318799972534 

Epoch 1, batch 1477
training loss: 0.2435084581375122 

Epoch 1, batch 1478
training loss: 0.197

Epoch 1, batch 1679
training loss: 0.2217838019132614 

Epoch 1, batch 1680
training loss: 0.3165901303291321 

Epoch 1, batch 1681
training loss: 0.117467500269413 

Epoch 1, batch 1682
training loss: 0.08417264372110367 

Epoch 1, batch 1683
training loss: 0.2960285246372223 

Epoch 1, batch 1684
training loss: 0.15512099862098694 

Epoch 1, batch 1685
training loss: 0.49338358640670776 

Epoch 1, batch 1686
training loss: 0.4379088282585144 

Epoch 1, batch 1687
training loss: 0.12909959256649017 

Epoch 1, batch 1688
training loss: 0.17330698668956757 

Epoch 1, batch 1689
training loss: 0.8255631327629089 

Epoch 1, batch 1690
training loss: 0.21511848270893097 

Epoch 1, batch 1691
training loss: 0.4124855101108551 

Epoch 1, batch 1692
training loss: 0.08872078359127045 

Epoch 1, batch 1693
training loss: 0.18773548305034637 

Epoch 1, batch 1694
training loss: 0.05367227643728256 

Epoch 1, batch 1695
training loss: 0.6797576546669006 

Epoch 1, batch 1696
training loss: 0.295

Epoch 1, batch 1902
training loss: 0.09255890548229218 

Epoch 1, batch 1903
training loss: 0.7129300236701965 

Epoch 1, batch 1904
training loss: 0.4808577001094818 

Epoch 1, batch 1905
training loss: 0.09878379106521606 

Epoch 1, batch 1906
training loss: 0.4125819802284241 

Epoch 1, batch 1907
training loss: 0.09205158054828644 

Epoch 1, batch 1908
training loss: 0.35162556171417236 

Epoch 1, batch 1909
training loss: 0.09045332670211792 

Epoch 1, batch 1910
training loss: 0.6131477355957031 

Epoch 1, batch 1911
training loss: 0.27310246229171753 

Epoch 1, batch 1912
training loss: 0.2723151743412018 

Epoch 1, batch 1913
training loss: 0.15766140818595886 

Epoch 1, batch 1914
training loss: 0.16297920048236847 

Epoch 1, batch 1915
training loss: 0.10617633163928986 

Epoch 1, batch 1916
training loss: 0.3182864785194397 

Epoch 1, batch 1917
training loss: 0.30997180938720703 

Epoch 1, batch 1918
training loss: 0.43524178862571716 

Epoch 1, batch 1919
training loss: 0.

Epoch 1, batch 2121
training loss: 0.10731060802936554 

Epoch 1, batch 2122
training loss: 0.1217857375741005 

Epoch 1, batch 2123
training loss: 0.15347793698310852 

Epoch 1, batch 2124
training loss: 0.11572793871164322 

Epoch 1, batch 2125
training loss: 0.23600609600543976 

Epoch 1, batch 2126
training loss: 0.4085657596588135 

Epoch 1, batch 2127
training loss: 0.8015694618225098 

Epoch 1, batch 2128
training loss: 0.3490888476371765 

Epoch 1, batch 2129
training loss: 0.04892347753047943 

Epoch 1, batch 2130
training loss: 0.8359448313713074 

Epoch 1, batch 2131
training loss: 0.187454491853714 

Epoch 1, batch 2132
training loss: 0.13927069306373596 

Epoch 1, batch 2133
training loss: 0.1450968086719513 

Epoch 1, batch 2134
training loss: 0.4456240236759186 

Epoch 1, batch 2135
training loss: 0.15304572880268097 

Epoch 1, batch 2136
training loss: 0.12142373621463776 

Epoch 1, batch 2137
training loss: 0.2843684256076813 

Epoch 1, batch 2138
training loss: 0.1808

Epoch 1, batch 2345
training loss: 0.15482120215892792 

Epoch 1, batch 2346
training loss: 0.1424318104982376 

Epoch 1, batch 2347
training loss: 0.518168568611145 

Epoch 1, batch 2348
training loss: 0.19446639716625214 

Epoch 1, batch 2349
training loss: 0.3821336627006531 

Epoch 1, batch 2350
training loss: 0.5800854563713074 

Epoch 1, batch 2351
training loss: 0.13642969727516174 

Epoch 1, batch 2352
training loss: 0.2270042598247528 

Epoch 1, batch 2353
training loss: 0.4543500542640686 

Epoch 1, batch 2354
training loss: 0.6715874075889587 

Epoch 1, batch 2355
training loss: 0.0313694104552269 

Epoch 1, batch 2356
training loss: 0.8306707143783569 

Epoch 1, batch 2357
training loss: 0.40989789366722107 

Epoch 1, batch 2358
training loss: 0.3049679398536682 

Epoch 1, batch 2359
training loss: 0.13880720734596252 

Epoch 1, batch 2360
training loss: 0.0893857330083847 

Epoch 1, batch 2361
training loss: 0.10765568912029266 

Epoch 1, batch 2362
training loss: 0.478751

Epoch 1, batch 2561
training loss: 0.298582524061203 

Epoch 1, batch 2562
training loss: 0.46948033571243286 

Epoch 1, batch 2563
training loss: 0.3931581676006317 

Epoch 1, batch 2564
training loss: 0.4899415969848633 

Epoch 1, batch 2565
training loss: 0.3032914698123932 

Epoch 1, batch 2566
training loss: 0.05865924805402756 

Epoch 1, batch 2567
training loss: 0.5680174231529236 

Epoch 1, batch 2568
training loss: 0.4871242940425873 

Epoch 1, batch 2569
training loss: 0.100083127617836 

Epoch 1, batch 2570
training loss: 0.6542172431945801 

Epoch 1, batch 2571
training loss: 0.129388689994812 

Epoch 1, batch 2572
training loss: 0.1861634999513626 

Epoch 1, batch 2573
training loss: 0.24306583404541016 

Epoch 1, batch 2574
training loss: 0.332651287317276 

Epoch 1, batch 2575
training loss: 0.29243913292884827 

Epoch 1, batch 2576
training loss: 0.2626882493495941 

Epoch 1, batch 2577
training loss: 0.08674611896276474 

Epoch 1, batch 2578
training loss: 0.4760418832

Epoch 1, batch 2781
training loss: 0.2083429992198944 

Epoch 1, batch 2782
training loss: 0.25077441334724426 

Epoch 1, batch 2783
training loss: 0.3306714594364166 

Epoch 1, batch 2784
training loss: 0.2569480836391449 

Epoch 1, batch 2785
training loss: 0.24746227264404297 

Epoch 1, batch 2786
training loss: 0.05820322036743164 

Epoch 1, batch 2787
training loss: 0.26393893361091614 

Epoch 1, batch 2788
training loss: 0.786688506603241 

Epoch 1, batch 2789
training loss: 0.4306116998195648 

Epoch 1, batch 2790
training loss: 0.0636792853474617 

Epoch 1, batch 2791
training loss: 0.1940772533416748 

Epoch 1, batch 2792
training loss: 0.11604533344507217 

Epoch 1, batch 2793
training loss: 0.3244984745979309 

Epoch 1, batch 2794
training loss: 0.08191944658756256 

Epoch 1, batch 2795
training loss: 0.08723039925098419 

Epoch 1, batch 2796
training loss: 0.6787446737289429 

Epoch 1, batch 2797
training loss: 0.14260850846767426 

Epoch 1, batch 2798
training loss: 0.1122

Epoch 1, batch 3000
training loss: 0.34424757957458496 

Epoch 1, batch 3001
training loss: 0.29192477464675903 

Epoch 1, batch 3002
training loss: 0.10906416177749634 

Epoch 1, batch 3003
training loss: 0.7023348808288574 

Epoch 1, batch 3004
training loss: 0.2294464409351349 

Epoch 1, batch 3005
training loss: 0.34894484281539917 

Epoch 1, batch 3006
training loss: 0.10095387697219849 

Epoch 1, batch 3007
training loss: 0.13551399111747742 

Epoch 1, batch 3008
training loss: 0.11384803056716919 

Epoch 1, batch 3009
training loss: 0.43076223134994507 

Epoch 1, batch 3010
training loss: 0.11246446520090103 

Epoch 1, batch 3011
training loss: 0.29212644696235657 

Epoch 1, batch 3012
training loss: 0.05175672844052315 

Epoch 1, batch 3013
training loss: 0.13367262482643127 

Epoch 1, batch 3014
training loss: 0.041761964559555054 

Epoch 1, batch 3015
training loss: 0.18181060254573822 

Epoch 1, batch 3016
training loss: 0.3435065448284149 

Epoch 1, batch 3017
training loss

Epoch 1, batch 3221
training loss: 0.0356084406375885 

Epoch 1, batch 3222
training loss: 0.09066017717123032 

Epoch 1, batch 3223
training loss: 0.8906117677688599 

Epoch 1, batch 3224
training loss: 0.39486753940582275 

Epoch 1, batch 3225
training loss: 0.23506975173950195 

Epoch 1, batch 3226
training loss: 0.12525765597820282 

Epoch 1, batch 3227
training loss: 0.2695423364639282 

Epoch 1, batch 3228
training loss: 0.2031112015247345 

Epoch 1, batch 3229
training loss: 0.025026563555002213 

Epoch 1, batch 3230
training loss: 0.17818042635917664 

Epoch 1, batch 3231
training loss: 0.493023544549942 

Epoch 1, batch 3232
training loss: 0.5295490026473999 

Epoch 1, batch 3233
training loss: 0.5691500902175903 

Epoch 1, batch 3234
training loss: 0.2704264223575592 

Epoch 1, batch 3235
training loss: 0.10540206730365753 

Epoch 1, batch 3236
training loss: 0.13688483834266663 

Epoch 1, batch 3237
training loss: 0.04106258600950241 

Epoch 1, batch 3238
training loss: 0.46

Epoch 1, batch 3440
training loss: 0.540515661239624 

Epoch 1, batch 3441
training loss: 0.07590744644403458 

Epoch 1, batch 3442
training loss: 0.1588839441537857 

Epoch 1, batch 3443
training loss: 0.17050369083881378 

Epoch 1, batch 3444
training loss: 0.3205687999725342 

Epoch 1, batch 3445
training loss: 0.6258960962295532 

Epoch 1, batch 3446
training loss: 0.34083935618400574 

Epoch 1, batch 3447
training loss: 0.1866430640220642 

Epoch 1, batch 3448
training loss: 0.07809038460254669 

Epoch 1, batch 3449
training loss: 0.185221865773201 

Epoch 1, batch 3450
training loss: 0.2139725387096405 

Epoch 1, batch 3451
training loss: 0.16149500012397766 

Epoch 1, batch 3452
training loss: 0.28525063395500183 

Epoch 1, batch 3453
training loss: 0.974875271320343 

Epoch 1, batch 3454
training loss: 0.48860007524490356 

Epoch 1, batch 3455
training loss: 0.16416022181510925 

Epoch 1, batch 3456
training loss: 0.14427503943443298 

Epoch 1, batch 3457
training loss: 0.38515

Epoch 1, batch 3658
training loss: 0.6294676065444946 

Epoch 1, batch 3659
training loss: 0.33074671030044556 

Epoch 1, batch 3660
training loss: 0.07956536114215851 

Epoch 1, batch 3661
training loss: 0.14446377754211426 

Epoch 1, batch 3662
training loss: 0.5010702610015869 

Epoch 1, batch 3663
training loss: 0.3959185481071472 

Epoch 1, batch 3664
training loss: 0.29029709100723267 

Epoch 1, batch 3665
training loss: 0.44754189252853394 

Epoch 1, batch 3666
training loss: 0.2785537838935852 

Epoch 1, batch 3667
training loss: 0.11674348264932632 

Epoch 1, batch 3668
training loss: 0.0809025913476944 

Epoch 1, batch 3669
training loss: 0.12109603732824326 

Epoch 1, batch 3670
training loss: 0.09018469601869583 

Epoch 1, batch 3671
training loss: 0.5846381187438965 

Epoch 1, batch 3672
training loss: 0.13297533988952637 

Epoch 1, batch 3673
training loss: 0.1196218952536583 

Epoch 1, batch 3674
training loss: 0.46283596754074097 

Epoch 1, batch 3675
training loss: 0.4

Epoch 1, batch 3877
training loss: 0.05409518629312515 

Epoch 1, batch 3878
training loss: 0.3973099887371063 

Epoch 1, batch 3879
training loss: 0.4725476801395416 

Epoch 1, batch 3880
training loss: 0.6066997051239014 

Epoch 1, batch 3881
training loss: 0.045554451644420624 

Epoch 1, batch 3882
training loss: 0.36992257833480835 

Epoch 1, batch 3883
training loss: 0.1772887408733368 

Epoch 1, batch 3884
training loss: 0.3941769599914551 

Epoch 1, batch 3885
training loss: 0.031633637845516205 

Epoch 1, batch 3886
training loss: 0.04029400646686554 

Epoch 1, batch 3887
training loss: 0.12252958863973618 

Epoch 1, batch 3888
training loss: 0.22844476997852325 

Epoch 1, batch 3889
training loss: 0.36289915442466736 

Epoch 1, batch 3890
training loss: 0.11138667166233063 

Epoch 1, batch 3891
training loss: 0.11649255454540253 

Epoch 1, batch 3892
training loss: 0.12381911277770996 

Epoch 1, batch 3893
training loss: 0.4296598434448242 

Epoch 1, batch 3894
training loss: 

Epoch 1, batch 4085
training loss: 0.26935282349586487 

Epoch 1, batch 4086
training loss: 0.04654182121157646 

Epoch 1, batch 4087
training loss: 0.5825656652450562 

Epoch 1, batch 4088
training loss: 0.28049522638320923 

Epoch 1, batch 4089
training loss: 0.04677622765302658 

Epoch 1, batch 4090
training loss: 0.10906050354242325 

Epoch 1, batch 4091
training loss: 0.05737396329641342 

Epoch 1, batch 4092
training loss: 0.36326348781585693 

Epoch 1, batch 4093
training loss: 0.49141472578048706 

Epoch 1, batch 4094
training loss: 0.20841145515441895 

Epoch 1, batch 4095
training loss: 0.0822761133313179 

Epoch 1, batch 4096
training loss: 0.22130493819713593 

Epoch 1, batch 4097
training loss: 0.37936222553253174 

Epoch 1, batch 4098
training loss: 0.2761647701263428 

Epoch 1, batch 4099
training loss: 0.03946330025792122 

Epoch 1, batch 4100
training loss: 0.3557945489883423 

Epoch 1, batch 4101
training loss: 0.18207313120365143 

Epoch 1, batch 4102
training loss: 

Epoch 1, batch 4305
training loss: 0.6752390265464783 

Epoch 1, batch 4306
training loss: 0.7390570640563965 

Epoch 1, batch 4307
training loss: 0.7626603841781616 

Epoch 1, batch 4308
training loss: 0.09207174181938171 

Epoch 1, batch 4309
training loss: 0.2710699737071991 

Epoch 1, batch 4310
training loss: 0.1565892994403839 

Epoch 1, batch 4311
training loss: 0.16692587733268738 

Epoch 1, batch 4312
training loss: 0.29611486196517944 

Epoch 1, batch 4313
training loss: 0.40188097953796387 

Epoch 1, batch 4314
training loss: 0.12570355832576752 

Epoch 1, batch 4315
training loss: 0.4554007947444916 

Epoch 1, batch 4316
training loss: 0.10350265353918076 

Epoch 1, batch 4317
training loss: 0.18018095195293427 

Epoch 1, batch 4318
training loss: 0.1751064956188202 

Epoch 1, batch 4319
training loss: 0.4420631527900696 

Epoch 1, batch 4320
training loss: 0.06132153794169426 

Epoch 1, batch 4321
training loss: 0.14403268694877625 

Epoch 1, batch 4322
training loss: 0.31

Epoch 1, batch 4524
training loss: 0.5808089971542358 

Epoch 1, batch 4525
training loss: 0.8207833170890808 

Epoch 1, batch 4526
training loss: 0.3045373857021332 

Epoch 1, batch 4527
training loss: 0.5218149423599243 

Epoch 1, batch 4528
training loss: 0.17424263060092926 

Epoch 1, batch 4529
training loss: 0.8109881281852722 

Epoch 1, batch 4530
training loss: 0.20729514956474304 

Epoch 1, batch 4531
training loss: 0.08436594903469086 

Epoch 1, batch 4532
training loss: 0.16975665092468262 

Epoch 1, batch 4533
training loss: 0.6751340627670288 

Epoch 1, batch 4534
training loss: 0.09231475740671158 

Epoch 1, batch 4535
training loss: 0.18190938234329224 

Epoch 1, batch 4536
training loss: 0.10126273334026337 

Epoch 1, batch 4537
training loss: 0.1473291665315628 

Epoch 1, batch 4538
training loss: 1.6423842906951904 

Epoch 1, batch 4539
training loss: 0.09493875503540039 

Epoch 1, batch 4540
training loss: 0.6681647300720215 

Epoch 1, batch 4541
training loss: 0.715

Epoch 1, batch 4747
training loss: 0.2544230818748474 

Epoch 1, batch 4748
training loss: 0.5491506457328796 

Epoch 1, batch 4749
training loss: 0.07952930778265 

Epoch 1, batch 4750
training loss: 0.03726252168416977 

Epoch 1, batch 4751
training loss: 0.4020215570926666 

Epoch 1, batch 4752
training loss: 0.16747485101222992 

Epoch 1, batch 4753
training loss: 0.3861958384513855 

Epoch 1, batch 4754
training loss: 0.08830247819423676 

Epoch 1, batch 4755
training loss: 0.22732293605804443 

Epoch 1, batch 4756
training loss: 0.06500244140625 

Epoch 1, batch 4757
training loss: 0.4407424032688141 

Epoch 1, batch 4758
training loss: 0.4450301229953766 

Epoch 1, batch 4759
training loss: 0.050843797624111176 

Epoch 1, batch 4760
training loss: 0.2609761357307434 

Epoch 1, batch 4761
training loss: 0.2619834542274475 

Epoch 1, batch 4762
training loss: 0.17707696557044983 

Epoch 1, batch 4763
training loss: 0.4020654261112213 

Epoch 1, batch 4764
training loss: 0.49200105

Epoch 1, batch 4972
training loss: 0.14034101366996765 

Epoch 1, batch 4973
training loss: 0.5420080423355103 

Epoch 1, batch 4974
training loss: 0.1941913217306137 

Epoch 1, batch 4975
training loss: 0.7713819146156311 

Epoch 1, batch 4976
training loss: 0.21337616443634033 

Epoch 1, batch 4977
training loss: 0.2806223928928375 

Epoch 1, batch 4978
training loss: 0.47841644287109375 

Epoch 1, batch 4979
training loss: 0.35505253076553345 

Epoch 1, batch 4980
training loss: 0.1996823251247406 

Epoch 1, batch 4981
training loss: 0.06333853304386139 

Epoch 1, batch 4982
training loss: 0.07929481565952301 

Epoch 1, batch 4983
training loss: 0.08743686974048615 

Epoch 1, batch 4984
training loss: 0.06832821667194366 

Epoch 1, batch 4985
training loss: 0.15091606974601746 

Epoch 1, batch 4986
training loss: 0.06795458495616913 

Epoch 1, batch 4987
training loss: 0.03758310154080391 

Epoch 1, batch 4988
training loss: 0.29642683267593384 

Epoch 1, batch 4989
training loss: 0

Epoch 1, batch 5192
training loss: 0.4770564138889313 

Epoch 1, batch 5193
training loss: 0.14532822370529175 

Epoch 1, batch 5194
training loss: 0.20680570602416992 

Epoch 1, batch 5195
training loss: 0.04958751052618027 

Epoch 1, batch 5196
training loss: 0.11959853023290634 

Epoch 1, batch 5197
training loss: 0.09670545160770416 

Epoch 1, batch 5198
training loss: 0.13019642233848572 

Epoch 1, batch 5199
training loss: 0.042682334780693054 

Epoch 1, batch 5200
training loss: 0.23034493625164032 

Epoch 1, batch 5201
training loss: 0.2696707546710968 

Epoch 1, batch 5202
training loss: 0.036085229367017746 

Epoch 1, batch 5203
training loss: 0.07530159503221512 

Epoch 1, batch 5204
training loss: 0.4449027180671692 

Epoch 1, batch 5205
training loss: 0.43338117003440857 

Epoch 1, batch 5206
training loss: 0.23734073340892792 

Epoch 1, batch 5207
training loss: 0.09448374807834625 

Epoch 1, batch 5208
training loss: 0.4173767566680908 

Epoch 1, batch 5209
training loss

Epoch 1, batch 5413
training loss: 0.8888746500015259 

Epoch 1, batch 5414
training loss: 0.5083380341529846 

Epoch 1, batch 5415
training loss: 0.3486504554748535 

Epoch 1, batch 5416
training loss: 0.34575626254081726 

Epoch 1, batch 5417
training loss: 0.27924513816833496 

Epoch 1, batch 5418
training loss: 0.14350208640098572 

Epoch 1, batch 5419
training loss: 0.21319587528705597 

Epoch 1, batch 5420
training loss: 0.03166165202856064 

Epoch 1, batch 5421
training loss: 0.38572683930397034 

Epoch 1, batch 5422
training loss: 0.42227035760879517 

Epoch 1, batch 5423
training loss: 0.44982701539993286 

Epoch 1, batch 5424
training loss: 0.2640814483165741 

Epoch 1, batch 5425
training loss: 0.2852155566215515 

Epoch 1, batch 5426
training loss: 0.11482846736907959 

Epoch 1, batch 5427
training loss: 0.31262078881263733 

Epoch 1, batch 5428
training loss: 0.0702456384897232 

Epoch 1, batch 5429
training loss: 0.5933713316917419 

Epoch 1, batch 5430
training loss: 0.2

Epoch 1, batch 5632
training loss: 0.12024680525064468 

Epoch 1, batch 5633
training loss: 0.5919647812843323 

Epoch 1, batch 5634
training loss: 0.291167676448822 

Epoch 1, batch 5635
training loss: 0.5855323076248169 

Epoch 1, batch 5636
training loss: 0.03193334490060806 

Epoch 1, batch 5637
training loss: 0.4849678575992584 

Epoch 1, batch 5638
training loss: 0.07408034056425095 

Epoch 1, batch 5639
training loss: 0.5286895036697388 

Epoch 1, batch 5640
training loss: 0.09331000596284866 

Epoch 1, batch 5641
training loss: 0.02139422297477722 

Epoch 1, batch 5642
training loss: 0.289012610912323 

Epoch 1, batch 5643
training loss: 0.24804210662841797 

Epoch 1, batch 5644
training loss: 0.5030097961425781 

Epoch 1, batch 5645
training loss: 0.29308634996414185 

Epoch 1, batch 5646
training loss: 0.23942255973815918 

Epoch 1, batch 5647
training loss: 0.3687823414802551 

Epoch 1, batch 5648
training loss: 0.1895075887441635 

Epoch 1, batch 5649
training loss: 0.45310

Epoch 1, batch 5850
training loss: 0.2379118949174881 

Epoch 1, batch 5851
training loss: 0.043485332280397415 

Epoch 1, batch 5852
training loss: 0.1631416380405426 

Epoch 1, batch 5853
training loss: 0.5665901899337769 

Epoch 1, batch 5854
training loss: 0.030232852324843407 

Epoch 1, batch 5855
training loss: 0.15484222769737244 

Epoch 1, batch 5856
training loss: 0.9013116955757141 

Epoch 1, batch 5857
training loss: 0.49913159012794495 

Epoch 1, batch 5858
training loss: 0.6593440771102905 

Epoch 1, batch 5859
training loss: 0.32876408100128174 

Epoch 1, batch 5860
training loss: 0.025987640023231506 

Epoch 1, batch 5861
training loss: 0.42071694135665894 

Epoch 1, batch 5862
training loss: 1.1845533847808838 

Epoch 1, batch 5863
training loss: 0.11229103803634644 

Epoch 1, batch 5864
training loss: 0.08683282881975174 

Epoch 1, batch 5865
training loss: 0.5739898085594177 

Epoch 1, batch 5866
training loss: 0.12743280827999115 

Epoch 1, batch 5867
training loss: 

Epoch 2, batch 69
training loss: 0.2401927262544632 

Epoch 2, batch 70
training loss: 0.046961911022663116 

Epoch 2, batch 71
training loss: 0.17270693182945251 

Epoch 2, batch 72
training loss: 0.121688112616539 

Epoch 2, batch 73
training loss: 0.06493644416332245 

Epoch 2, batch 74
training loss: 0.05608642101287842 

Epoch 2, batch 75
training loss: 0.3521830439567566 

Epoch 2, batch 76
training loss: 0.11667950451374054 

Epoch 2, batch 77
training loss: 0.05284934490919113 

Epoch 2, batch 78
training loss: 0.06085687875747681 

Epoch 2, batch 79
training loss: 0.2253313511610031 

Epoch 2, batch 80
training loss: 0.027949893847107887 

Epoch 2, batch 81
training loss: 0.03404238447546959 

Epoch 2, batch 82
training loss: 0.24603283405303955 

Epoch 2, batch 83
training loss: 0.1491260677576065 

Epoch 2, batch 84
training loss: 0.6138494610786438 

Epoch 2, batch 85
training loss: 0.28101077675819397 

Epoch 2, batch 86
training loss: 0.1557234823703766 

Epoch 2, batch 8

Epoch 2, batch 285
training loss: 0.12940874695777893 

Epoch 2, batch 286
training loss: 0.1478191316127777 

Epoch 2, batch 287
training loss: 0.40859609842300415 

Epoch 2, batch 288
training loss: 0.19586127996444702 

Epoch 2, batch 289
training loss: 0.045633818954229355 

Epoch 2, batch 290
training loss: 0.18685156106948853 

Epoch 2, batch 291
training loss: 0.02815123274922371 

Epoch 2, batch 292
training loss: 0.031150419265031815 

Epoch 2, batch 293
training loss: 0.07449363172054291 

Epoch 2, batch 294
training loss: 0.46748679876327515 

Epoch 2, batch 295
training loss: 0.044079769402742386 

Epoch 2, batch 296
training loss: 0.264251708984375 

Epoch 2, batch 297
training loss: 0.032139528542757034 

Epoch 2, batch 298
training loss: 0.7513174414634705 

Epoch 2, batch 299
training loss: 0.09107807278633118 

Epoch 2, batch 300
training loss: 0.06316272914409637 

Epoch 2, batch 301
training loss: 0.03583953529596329 

Epoch 2, batch 302
training loss: 0.083508804440

Epoch 2, batch 507
training loss: 0.16110111773014069 

Epoch 2, batch 508
training loss: 0.14101167023181915 

Epoch 2, batch 509
training loss: 0.061723530292510986 

Epoch 2, batch 510
training loss: 0.11908695846796036 

Epoch 2, batch 511
training loss: 0.06207238882780075 

Epoch 2, batch 512
training loss: 0.028070393949747086 

Epoch 2, batch 513
training loss: 0.14094354212284088 

Epoch 2, batch 514
training loss: 0.043950121849775314 

Epoch 2, batch 515
training loss: 0.08717858791351318 

Epoch 2, batch 516
training loss: 0.09718478471040726 

Epoch 2, batch 517
training loss: 0.16347390413284302 

Epoch 2, batch 518
training loss: 0.018946079537272453 

Epoch 2, batch 519
training loss: 0.08398894965648651 

Epoch 2, batch 520
training loss: 0.03152824193239212 

Epoch 2, batch 521
training loss: 0.03487405925989151 

Epoch 2, batch 522
training loss: 0.24010813236236572 

Epoch 2, batch 523
training loss: 0.3338150382041931 

Epoch 2, batch 524
training loss: 0.094655059

Epoch 2, batch 727
training loss: 0.02543514035642147 

Epoch 2, batch 728
training loss: 0.2881303131580353 

Epoch 2, batch 729
training loss: 1.3697993755340576 

Epoch 2, batch 730
training loss: 0.04931085929274559 

Epoch 2, batch 731
training loss: 0.4075709283351898 

Epoch 2, batch 732
training loss: 0.049889370799064636 

Epoch 2, batch 733
training loss: 0.0691574290394783 

Epoch 2, batch 734
training loss: 0.08951500058174133 

Epoch 2, batch 735
training loss: 0.3571721613407135 

Epoch 2, batch 736
training loss: 0.09603094309568405 

Epoch 2, batch 737
training loss: 0.3560045063495636 

Epoch 2, batch 738
training loss: 0.1883111447095871 

Epoch 2, batch 739
training loss: 0.2217450588941574 

Epoch 2, batch 740
training loss: 0.14883354306221008 

Epoch 2, batch 741
training loss: 0.10445266962051392 

Epoch 2, batch 742
training loss: 0.046838946640491486 

Epoch 2, batch 743
training loss: 0.05323050171136856 

Epoch 2, batch 744
training loss: 0.33378130197525024 

Epoch 2, batch 948
training loss: 0.10334908962249756 

Epoch 2, batch 949
training loss: 0.0384845994412899 

Epoch 2, batch 950
training loss: 0.025840258225798607 

Epoch 2, batch 951
training loss: 0.5574865937232971 

Epoch 2, batch 952
training loss: 0.2345248907804489 

Epoch 2, batch 953
training loss: 0.22736242413520813 

Epoch 2, batch 954
training loss: 0.15428854525089264 

Epoch 2, batch 955
training loss: 0.04286932200193405 

Epoch 2, batch 956
training loss: 0.32783398032188416 

Epoch 2, batch 957
training loss: 0.4593953490257263 

Epoch 2, batch 958
training loss: 0.19155588746070862 

Epoch 2, batch 959
training loss: 0.17701812088489532 

Epoch 2, batch 960
training loss: 0.33144611120224 

Epoch 2, batch 961
training loss: 0.5342486500740051 

Epoch 2, batch 962
training loss: 0.06810951232910156 

Epoch 2, batch 963
training loss: 0.05989563465118408 

Epoch 2, batch 964
training loss: 0.7889832258224487 

Epoch 2, batch 965
training loss: 0.11668721586465836 



Epoch 2, batch 1170
training loss: 0.48534178733825684 

Epoch 2, batch 1171
training loss: 0.16550730168819427 

Epoch 2, batch 1172
training loss: 0.16898687183856964 

Epoch 2, batch 1173
training loss: 0.11747340857982635 

Epoch 2, batch 1174
training loss: 0.09850236773490906 

Epoch 2, batch 1175
training loss: 0.19651362299919128 

Epoch 2, batch 1176
training loss: 0.1443784534931183 

Epoch 2, batch 1177
training loss: 0.24215546250343323 

Epoch 2, batch 1178
training loss: 0.1039872020483017 

Epoch 2, batch 1179
training loss: 0.0790681391954422 

Epoch 2, batch 1180
training loss: 0.1580859273672104 

Epoch 2, batch 1181
training loss: 0.44849857687950134 

Epoch 2, batch 1182
training loss: 0.11524097621440887 

Epoch 2, batch 1183
training loss: 0.016718974336981773 

Epoch 2, batch 1184
training loss: 0.7010101675987244 

Epoch 2, batch 1185
training loss: 0.10858608782291412 

Epoch 2, batch 1186
training loss: 0.0758872851729393 

Epoch 2, batch 1187
training loss: 0

Epoch 2, batch 1391
training loss: 0.3157136142253876 

Epoch 2, batch 1392
training loss: 0.1169571653008461 

Epoch 2, batch 1393
training loss: 0.1401352882385254 

Epoch 2, batch 1394
training loss: 0.111861452460289 

Epoch 2, batch 1395
training loss: 0.6293646097183228 

Epoch 2, batch 1396
training loss: 0.03888525813817978 

Epoch 2, batch 1397
training loss: 0.08732683956623077 

Epoch 2, batch 1398
training loss: 0.4516269266605377 

Epoch 2, batch 1399
training loss: 0.14480486512184143 

Epoch 2, batch 1400
training loss: 0.3023354411125183 

Epoch 2, batch 1401
training loss: 0.16533127427101135 

Epoch 2, batch 1402
training loss: 0.09947732836008072 

Epoch 2, batch 1403
training loss: 0.33400386571884155 

Epoch 2, batch 1404
training loss: 0.11098821461200714 

Epoch 2, batch 1405
training loss: 0.4487418532371521 

Epoch 2, batch 1406
training loss: 0.4914481043815613 

Epoch 2, batch 1407
training loss: 0.2711647152900696 

Epoch 2, batch 1408
training loss: 0.59929

Epoch 2, batch 1614
training loss: 0.38340839743614197 

Epoch 2, batch 1615
training loss: 0.16569212079048157 

Epoch 2, batch 1616
training loss: 0.1383778154850006 

Epoch 2, batch 1617
training loss: 0.8125694394111633 

Epoch 2, batch 1618
training loss: 0.6820600628852844 

Epoch 2, batch 1619
training loss: 0.2535436153411865 

Epoch 2, batch 1620
training loss: 0.6014257669448853 

Epoch 2, batch 1621
training loss: 0.11388500034809113 

Epoch 2, batch 1622
training loss: 0.5527151226997375 

Epoch 2, batch 1623
training loss: 0.12050548940896988 

Epoch 2, batch 1624
training loss: 0.08293962478637695 

Epoch 2, batch 1625
training loss: 0.05227797105908394 

Epoch 2, batch 1626
training loss: 0.21726679801940918 

Epoch 2, batch 1627
training loss: 0.11196094751358032 

Epoch 2, batch 1628
training loss: 0.2652677893638611 

Epoch 2, batch 1629
training loss: 0.28094232082366943 

Epoch 2, batch 1630
training loss: 0.10289790481328964 

Epoch 2, batch 1631
training loss: 0.1

Epoch 2, batch 1834
training loss: 0.1972499042749405 

Epoch 2, batch 1835
training loss: 0.2954300343990326 

Epoch 2, batch 1836
training loss: 0.047598473727703094 

Epoch 2, batch 1837
training loss: 0.3870212435722351 

Epoch 2, batch 1838
training loss: 0.10317985713481903 

Epoch 2, batch 1839
training loss: 0.3325822353363037 

Epoch 2, batch 1840
training loss: 0.01877276971936226 

Epoch 2, batch 1841
training loss: 0.3092614412307739 

Epoch 2, batch 1842
training loss: 0.38143840432167053 

Epoch 2, batch 1843
training loss: 0.09314610809087753 

Epoch 2, batch 1844
training loss: 0.0505099818110466 

Epoch 2, batch 1845
training loss: 0.07799317687749863 

Epoch 2, batch 1846
training loss: 0.19293978810310364 

Epoch 2, batch 1847
training loss: 0.5604156851768494 

Epoch 2, batch 1848
training loss: 0.061216987669467926 

Epoch 2, batch 1849
training loss: 0.14687256515026093 

Epoch 2, batch 1850
training loss: 0.2853747010231018 

Epoch 2, batch 1851
training loss: 0.

Epoch 2, batch 2050
training loss: 0.3872338831424713 

Epoch 2, batch 2051
training loss: 0.2655183672904968 

Epoch 2, batch 2052
training loss: 0.2953416407108307 

Epoch 2, batch 2053
training loss: 0.4179588854312897 

Epoch 2, batch 2054
training loss: 0.02889779582619667 

Epoch 2, batch 2055
training loss: 0.23739126324653625 

Epoch 2, batch 2056
training loss: 0.03976758196949959 

Epoch 2, batch 2057
training loss: 0.3834608197212219 

Epoch 2, batch 2058
training loss: 0.4147123694419861 

Epoch 2, batch 2059
training loss: 0.09657464921474457 

Epoch 2, batch 2060
training loss: 0.4862893521785736 

Epoch 2, batch 2061
training loss: 0.25958773493766785 

Epoch 2, batch 2062
training loss: 0.12835225462913513 

Epoch 2, batch 2063
training loss: 0.12584719061851501 

Epoch 2, batch 2064
training loss: 0.23208054900169373 

Epoch 2, batch 2065
training loss: 0.5142605304718018 

Epoch 2, batch 2066
training loss: 0.3245132565498352 

Epoch 2, batch 2067
training loss: 0.512

Epoch 2, batch 2273
training loss: 0.24332764744758606 

Epoch 2, batch 2274
training loss: 0.08642606437206268 

Epoch 2, batch 2275
training loss: 0.15733860433101654 

Epoch 2, batch 2276
training loss: 0.025464991107583046 

Epoch 2, batch 2277
training loss: 0.2006983757019043 

Epoch 2, batch 2278
training loss: 0.5217486619949341 

Epoch 2, batch 2279
training loss: 0.15282782912254333 

Epoch 2, batch 2280
training loss: 0.37351301312446594 

Epoch 2, batch 2281
training loss: 0.8281057476997375 

Epoch 2, batch 2282
training loss: 0.08612000197172165 

Epoch 2, batch 2283
training loss: 0.18027809262275696 

Epoch 2, batch 2284
training loss: 0.09228526055812836 

Epoch 2, batch 2285
training loss: 0.21548107266426086 

Epoch 2, batch 2286
training loss: 0.11424336582422256 

Epoch 2, batch 2287
training loss: 0.05595957115292549 

Epoch 2, batch 2288
training loss: 0.3717464208602905 

Epoch 2, batch 2289
training loss: 0.2908475995063782 

Epoch 2, batch 2290
training loss: 

Epoch 2, batch 2495
training loss: 0.2631324529647827 

Epoch 2, batch 2496
training loss: 0.7659053802490234 

Epoch 2, batch 2497
training loss: 0.03177756816148758 

Epoch 2, batch 2498
training loss: 0.06069228798151016 

Epoch 2, batch 2499
training loss: 0.2651117742061615 

Epoch 2, batch 2500
training loss: 0.06350599229335785 

Epoch 2, batch 2501
training loss: 0.11498758941888809 

Epoch 2, batch 2502
training loss: 0.054502446204423904 

Epoch 2, batch 2503
training loss: 0.24084463715553284 

Epoch 2, batch 2504
training loss: 0.11074511706829071 

Epoch 2, batch 2505
training loss: 0.17856566607952118 

Epoch 2, batch 2506
training loss: 0.0996188297867775 

Epoch 2, batch 2507
training loss: 0.2561706006526947 

Epoch 2, batch 2508
training loss: 0.05076298862695694 

Epoch 2, batch 2509
training loss: 0.630081832408905 

Epoch 2, batch 2510
training loss: 0.20474393665790558 

Epoch 2, batch 2511
training loss: 0.08628493547439575 

Epoch 2, batch 2512
training loss: 0.

Epoch 2, batch 2716
training loss: 0.26080840826034546 

Epoch 2, batch 2717
training loss: 0.10753272473812103 

Epoch 2, batch 2718
training loss: 0.04660102725028992 

Epoch 2, batch 2719
training loss: 0.12413118034601212 

Epoch 2, batch 2720
training loss: 0.05205681920051575 

Epoch 2, batch 2721
training loss: 0.06763119995594025 

Epoch 2, batch 2722
training loss: 0.06472037732601166 

Epoch 2, batch 2723
training loss: 0.6264358758926392 

Epoch 2, batch 2724
training loss: 0.5117902755737305 

Epoch 2, batch 2725
training loss: 0.020341040566563606 

Epoch 2, batch 2726
training loss: 0.16420693695545197 

Epoch 2, batch 2727
training loss: 0.14056751132011414 

Epoch 2, batch 2728
training loss: 0.14052817225456238 

Epoch 2, batch 2729
training loss: 0.06830845773220062 

Epoch 2, batch 2730
training loss: 0.41410690546035767 

Epoch 2, batch 2731
training loss: 0.09093042463064194 

Epoch 2, batch 2732
training loss: 0.07828960567712784 

Epoch 2, batch 2733
training los

Epoch 2, batch 2939
training loss: 0.08952098339796066 

Epoch 2, batch 2940
training loss: 0.12202546745538712 

Epoch 2, batch 2941
training loss: 0.05059831589460373 

Epoch 2, batch 2942
training loss: 0.2543949782848358 

Epoch 2, batch 2943
training loss: 0.05548935383558273 

Epoch 2, batch 2944
training loss: 0.2739330232143402 

Epoch 2, batch 2945
training loss: 0.2501174807548523 

Epoch 2, batch 2946
training loss: 0.08567477017641068 

Epoch 2, batch 2947
training loss: 0.6175194382667542 

Epoch 2, batch 2948
training loss: 0.04698260873556137 

Epoch 2, batch 2949
training loss: 0.42242035269737244 

Epoch 2, batch 2950
training loss: 0.028103778138756752 

Epoch 2, batch 2951
training loss: 0.3176735043525696 

Epoch 2, batch 2952
training loss: 0.29778164625167847 

Epoch 2, batch 2953
training loss: 0.05634468048810959 

Epoch 2, batch 2954
training loss: 0.1459587663412094 

Epoch 2, batch 2955
training loss: 0.6370295882225037 

Epoch 2, batch 2956
training loss: 0.

Epoch 2, batch 3162
training loss: 0.21438995003700256 

Epoch 2, batch 3163
training loss: 0.29939574003219604 

Epoch 2, batch 3164
training loss: 0.4862075746059418 

Epoch 2, batch 3165
training loss: 0.25412851572036743 

Epoch 2, batch 3166
training loss: 0.04583722725510597 

Epoch 2, batch 3167
training loss: 0.054214559495449066 

Epoch 2, batch 3168
training loss: 0.2335391789674759 

Epoch 2, batch 3169
training loss: 0.18860377371311188 

Epoch 2, batch 3170
training loss: 0.05852174758911133 

Epoch 2, batch 3171
training loss: 0.6281739473342896 

Epoch 2, batch 3172
training loss: 0.08259337395429611 

Epoch 2, batch 3173
training loss: 0.1281462013721466 

Epoch 2, batch 3174
training loss: 0.11772160232067108 

Epoch 2, batch 3175
training loss: 0.15420110523700714 

Epoch 2, batch 3176
training loss: 0.09153105318546295 

Epoch 2, batch 3177
training loss: 0.9216818809509277 

Epoch 2, batch 3178
training loss: 0.8232395052909851 

Epoch 2, batch 3179
training loss: 0

Epoch 2, batch 3383
training loss: 0.40901604294776917 

Epoch 2, batch 3384
training loss: 0.2844429612159729 

Epoch 2, batch 3385
training loss: 0.19536134600639343 

Epoch 2, batch 3386
training loss: 0.0291439201682806 

Epoch 2, batch 3387
training loss: 0.06072172522544861 

Epoch 2, batch 3388
training loss: 0.038148000836372375 

Epoch 2, batch 3389
training loss: 0.29012054204940796 

Epoch 2, batch 3390
training loss: 0.022432558238506317 

Epoch 2, batch 3391
training loss: 0.15739640593528748 

Epoch 2, batch 3392
training loss: 0.17866989970207214 

Epoch 2, batch 3393
training loss: 0.11535561084747314 

Epoch 2, batch 3394
training loss: 0.2757953107357025 

Epoch 2, batch 3395
training loss: 0.0619099922478199 

Epoch 2, batch 3396
training loss: 0.06810172647237778 

Epoch 2, batch 3397
training loss: 0.014990325085818768 

Epoch 2, batch 3398
training loss: 0.10916125774383545 

Epoch 2, batch 3399
training loss: 0.10522037744522095 

Epoch 2, batch 3400
training los

Epoch 2, batch 3606
training loss: 0.1660260260105133 

Epoch 2, batch 3607
training loss: 0.26486149430274963 

Epoch 2, batch 3608
training loss: 0.16623744368553162 

Epoch 2, batch 3609
training loss: 0.15711937844753265 

Epoch 2, batch 3610
training loss: 0.4976865351200104 

Epoch 2, batch 3611
training loss: 0.055247049778699875 

Epoch 2, batch 3612
training loss: 0.03615880757570267 

Epoch 2, batch 3613
training loss: 0.3153684735298157 

Epoch 2, batch 3614
training loss: 0.22316136956214905 

Epoch 2, batch 3615
training loss: 0.02331998385488987 

Epoch 2, batch 3616
training loss: 0.18795950710773468 

Epoch 2, batch 3617
training loss: 0.02453434467315674 

Epoch 2, batch 3618
training loss: 0.02061336673796177 

Epoch 2, batch 3619
training loss: 0.012368900701403618 

Epoch 2, batch 3620
training loss: 0.15638083219528198 

Epoch 2, batch 3621
training loss: 0.08463062345981598 

Epoch 2, batch 3622
training loss: 0.1116848960518837 

Epoch 2, batch 3623
training loss

Epoch 2, batch 3814
training loss: 0.5448931455612183 

Epoch 2, batch 3815
training loss: 1.1109977960586548 

Epoch 2, batch 3816
training loss: 0.23195764422416687 

Epoch 2, batch 3817
training loss: 0.4120500087738037 

Epoch 2, batch 3818
training loss: 0.6598657369613647 

Epoch 2, batch 3819
training loss: 0.11087091267108917 

Epoch 2, batch 3820
training loss: 0.3644393980503082 

Epoch 2, batch 3821
training loss: 0.6816145181655884 

Epoch 2, batch 3822
training loss: 0.030041631311178207 

Epoch 2, batch 3823
training loss: 0.2569628357887268 

Epoch 2, batch 3824
training loss: 0.19370122253894806 

Epoch 2, batch 3825
training loss: 0.04131767898797989 

Epoch 2, batch 3826
training loss: 0.3090765178203583 

Epoch 2, batch 3827
training loss: 0.03705131262540817 

Epoch 2, batch 3828
training loss: 0.15138736367225647 

Epoch 2, batch 3829
training loss: 0.2024795264005661 

Epoch 2, batch 3830
training loss: 0.06735280901193619 

Epoch 2, batch 3831
training loss: 0.13

Epoch 2, batch 4030
training loss: 0.09072275459766388 

Epoch 2, batch 4031
training loss: 0.10956092923879623 

Epoch 2, batch 4032
training loss: 0.10306324064731598 

Epoch 2, batch 4033
training loss: 0.18885226547718048 

Epoch 2, batch 4034
training loss: 0.4299953877925873 

Epoch 2, batch 4035
training loss: 0.11316166818141937 

Epoch 2, batch 4036
training loss: 0.04770346358418465 

Epoch 2, batch 4037
training loss: 0.1146656721830368 

Epoch 2, batch 4038
training loss: 0.14102782309055328 

Epoch 2, batch 4039
training loss: 0.4400080740451813 

Epoch 2, batch 4040
training loss: 0.03882133960723877 

Epoch 2, batch 4041
training loss: 0.6057659387588501 

Epoch 2, batch 4042
training loss: 0.030275270342826843 

Epoch 2, batch 4043
training loss: 0.021385755389928818 

Epoch 2, batch 4044
training loss: 0.017235800623893738 

Epoch 2, batch 4045
training loss: 0.031010564416646957 

Epoch 2, batch 4046
training loss: 0.1665944755077362 

Epoch 2, batch 4047
training los

Epoch 2, batch 4254
training loss: 0.10337589681148529 

Epoch 2, batch 4255
training loss: 0.11318663507699966 

Epoch 2, batch 4256
training loss: 0.05522741749882698 

Epoch 2, batch 4257
training loss: 0.14226865768432617 

Epoch 2, batch 4258
training loss: 0.27259957790374756 

Epoch 2, batch 4259
training loss: 0.2716972827911377 

Epoch 2, batch 4260
training loss: 0.20984673500061035 

Epoch 2, batch 4261
training loss: 0.17134304344654083 

Epoch 2, batch 4262
training loss: 0.026595845818519592 

Epoch 2, batch 4263
training loss: 0.10775282233953476 

Epoch 2, batch 4264
training loss: 0.026090800762176514 

Epoch 2, batch 4265
training loss: 0.031405720859766006 

Epoch 2, batch 4266
training loss: 0.11179956048727036 

Epoch 2, batch 4267
training loss: 0.2996590733528137 

Epoch 2, batch 4268
training loss: 0.20346865057945251 

Epoch 2, batch 4269
training loss: 0.13523855805397034 

Epoch 2, batch 4270
training loss: 0.3337109088897705 

Epoch 2, batch 4271
training lo

Epoch 2, batch 4474
training loss: 0.06372028589248657 

Epoch 2, batch 4475
training loss: 0.04716707020998001 

Epoch 2, batch 4476
training loss: 0.10053253173828125 

Epoch 2, batch 4477
training loss: 0.18489286303520203 

Epoch 2, batch 4478
training loss: 0.024465687572956085 

Epoch 2, batch 4479
training loss: 0.23290371894836426 

Epoch 2, batch 4480
training loss: 0.3425276279449463 

Epoch 2, batch 4481
training loss: 0.13683415949344635 

Epoch 2, batch 4482
training loss: 0.1483761966228485 

Epoch 2, batch 4483
training loss: 0.10783755779266357 

Epoch 2, batch 4484
training loss: 0.3574390709400177 

Epoch 2, batch 4485
training loss: 0.25284674763679504 

Epoch 2, batch 4486
training loss: 0.21378079056739807 

Epoch 2, batch 4487
training loss: 0.07528723776340485 

Epoch 2, batch 4488
training loss: 0.06502186506986618 

Epoch 2, batch 4489
training loss: 0.18791638314723969 

Epoch 2, batch 4490
training loss: 0.04538533836603165 

Epoch 2, batch 4491
training loss

Epoch 2, batch 4696
training loss: 0.24503548443317413 

Epoch 2, batch 4697
training loss: 0.4264039993286133 

Epoch 2, batch 4698
training loss: 0.07939713448286057 

Epoch 2, batch 4699
training loss: 0.02971968613564968 

Epoch 2, batch 4700
training loss: 0.02426745928823948 

Epoch 2, batch 4701
training loss: 0.19006165862083435 

Epoch 2, batch 4702
training loss: 0.19877420365810394 

Epoch 2, batch 4703
training loss: 0.09222345799207687 

Epoch 2, batch 4704
training loss: 0.19114641845226288 

Epoch 2, batch 4705
training loss: 0.2660764157772064 

Epoch 2, batch 4706
training loss: 0.04257868230342865 

Epoch 2, batch 4707
training loss: 0.34141677618026733 

Epoch 2, batch 4708
training loss: 0.11389487981796265 

Epoch 2, batch 4709
training loss: 0.09737219661474228 

Epoch 2, batch 4710
training loss: 0.08383466303348541 

Epoch 2, batch 4711
training loss: 0.05000748112797737 

Epoch 2, batch 4712
training loss: 0.07423659414052963 

Epoch 2, batch 4713
training loss

Epoch 2, batch 4913
training loss: 0.010613157413899899 

Epoch 2, batch 4914
training loss: 0.6935633420944214 

Epoch 2, batch 4915
training loss: 0.2786749601364136 

Epoch 2, batch 4916
training loss: 0.7408785223960876 

Epoch 2, batch 4917
training loss: 0.061241887509822845 

Epoch 2, batch 4918
training loss: 0.1454259753227234 

Epoch 2, batch 4919
training loss: 0.03490079566836357 

Epoch 2, batch 4920
training loss: 0.03931639343500137 

Epoch 2, batch 4921
training loss: 0.04575791209936142 

Epoch 2, batch 4922
training loss: 0.06286074221134186 

Epoch 2, batch 4923
training loss: 0.43528905510902405 

Epoch 2, batch 4924
training loss: 0.05201674625277519 

Epoch 2, batch 4925
training loss: 0.03996977582573891 

Epoch 2, batch 4926
training loss: 0.3563472628593445 

Epoch 2, batch 4927
training loss: 0.11332539469003677 

Epoch 2, batch 4928
training loss: 0.16641926765441895 

Epoch 2, batch 4929
training loss: 0.12724316120147705 

Epoch 2, batch 4930
training loss:

Epoch 2, batch 5137
training loss: 0.022449584677815437 

Epoch 2, batch 5138
training loss: 0.9241166114807129 

Epoch 2, batch 5139
training loss: 0.5917191505432129 

Epoch 2, batch 5140
training loss: 0.02142178639769554 

Epoch 2, batch 5141
training loss: 0.1873612403869629 

Epoch 2, batch 5142
training loss: 0.05619656294584274 

Epoch 2, batch 5143
training loss: 0.025925129652023315 

Epoch 2, batch 5144
training loss: 0.07011055201292038 

Epoch 2, batch 5145
training loss: 0.122282013297081 

Epoch 2, batch 5146
training loss: 0.04278546944260597 

Epoch 2, batch 5147
training loss: 0.08698612451553345 

Epoch 2, batch 5148
training loss: 0.2820207476615906 

Epoch 2, batch 5149
training loss: 0.1316368132829666 

Epoch 2, batch 5150
training loss: 0.5159033536911011 

Epoch 2, batch 5151
training loss: 0.03346579521894455 

Epoch 2, batch 5152
training loss: 0.7127028703689575 

Epoch 2, batch 5153
training loss: 0.20365600287914276 

Epoch 2, batch 5154
training loss: 0.0

Epoch 2, batch 5358
training loss: 0.13709808886051178 

Epoch 2, batch 5359
training loss: 1.0854463577270508 

Epoch 2, batch 5360
training loss: 0.025437330827116966 

Epoch 2, batch 5361
training loss: 0.3999404311180115 

Epoch 2, batch 5362
training loss: 0.16531549394130707 

Epoch 2, batch 5363
training loss: 0.1373824179172516 

Epoch 2, batch 5364
training loss: 0.2927877902984619 

Epoch 2, batch 5365
training loss: 0.3944091200828552 

Epoch 2, batch 5366
training loss: 0.0543367937207222 

Epoch 2, batch 5367
training loss: 0.2933894991874695 

Epoch 2, batch 5368
training loss: 0.028576716780662537 

Epoch 2, batch 5369
training loss: 0.030825486406683922 

Epoch 2, batch 5370
training loss: 0.32563814520835876 

Epoch 2, batch 5371
training loss: 0.02073391154408455 

Epoch 2, batch 5372
training loss: 0.22276318073272705 

Epoch 2, batch 5373
training loss: 0.018867252394557 

Epoch 2, batch 5374
training loss: 0.03476463630795479 

Epoch 2, batch 5375
training loss: 0.

Epoch 2, batch 5578
training loss: 0.02583571895956993 

Epoch 2, batch 5579
training loss: 0.04147682338953018 

Epoch 2, batch 5580
training loss: 0.1912086308002472 

Epoch 2, batch 5581
training loss: 0.12803688645362854 

Epoch 2, batch 5582
training loss: 0.13687121868133545 

Epoch 2, batch 5583
training loss: 0.10807938873767853 

Epoch 2, batch 5584
training loss: 0.12306137382984161 

Epoch 2, batch 5585
training loss: 0.30256351828575134 

Epoch 2, batch 5586
training loss: 0.6356302499771118 

Epoch 2, batch 5587
training loss: 0.20978352427482605 

Epoch 2, batch 5588
training loss: 0.2106427401304245 

Epoch 2, batch 5589
training loss: 0.1892259120941162 

Epoch 2, batch 5590
training loss: 0.02919284626841545 

Epoch 2, batch 5591
training loss: 0.03738034516572952 

Epoch 2, batch 5592
training loss: 0.17834389209747314 

Epoch 2, batch 5593
training loss: 0.19157476723194122 

Epoch 2, batch 5594
training loss: 0.5642956495285034 

Epoch 2, batch 5595
training loss: 0

Epoch 2, batch 5798
training loss: 0.03547457605600357 

Epoch 2, batch 5799
training loss: 0.02524930238723755 

Epoch 2, batch 5800
training loss: 0.1261800080537796 

Epoch 2, batch 5801
training loss: 0.5015488862991333 

Epoch 2, batch 5802
training loss: 0.04623015224933624 

Epoch 2, batch 5803
training loss: 0.16995398700237274 

Epoch 2, batch 5804
training loss: 0.04720309376716614 

Epoch 2, batch 5805
training loss: 0.8891714811325073 

Epoch 2, batch 5806
training loss: 0.3373878300189972 

Epoch 2, batch 5807
training loss: 0.012185153551399708 

Epoch 2, batch 5808
training loss: 0.04799559339880943 

Epoch 2, batch 5809
training loss: 0.5031554102897644 

Epoch 2, batch 5810
training loss: 0.05969496816396713 

Epoch 2, batch 5811
training loss: 0.26278072595596313 

Epoch 2, batch 5812
training loss: 0.058667831122875214 

Epoch 2, batch 5813
training loss: 0.15341642498970032 

Epoch 2, batch 5814
training loss: 0.3795086145401001 

Epoch 2, batch 5815
training loss: 

Epoch 3, batch 13
training loss: 0.09817735850811005 

Epoch 3, batch 14
training loss: 0.020160498097538948 

Epoch 3, batch 15
training loss: 0.16124722361564636 

Epoch 3, batch 16
training loss: 0.09675978124141693 

Epoch 3, batch 17
training loss: 0.26588380336761475 

Epoch 3, batch 18
training loss: 0.2602933347225189 

Epoch 3, batch 19
training loss: 0.10601887851953506 

Epoch 3, batch 20
training loss: 0.011115851812064648 

Epoch 3, batch 21
training loss: 0.2177988737821579 

Epoch 3, batch 22
training loss: 0.22832465171813965 

Epoch 3, batch 23
training loss: 0.027982190251350403 

Epoch 3, batch 24
training loss: 0.013735379092395306 

Epoch 3, batch 25
training loss: 0.4788009524345398 

Epoch 3, batch 26
training loss: 0.1575663834810257 

Epoch 3, batch 27
training loss: 0.06320085376501083 

Epoch 3, batch 28
training loss: 0.07886780798435211 

Epoch 3, batch 29
training loss: 0.03683317452669144 

Epoch 3, batch 30
training loss: 0.04929780215024948 

Epoch 3, b

Epoch 3, batch 231
training loss: 0.11032465845346451 

Epoch 3, batch 232
training loss: 0.057888418436050415 

Epoch 3, batch 233
training loss: 0.04165252298116684 

Epoch 3, batch 234
training loss: 0.04083555191755295 

Epoch 3, batch 235
training loss: 0.19270183145999908 

Epoch 3, batch 236
training loss: 0.11922243982553482 

Epoch 3, batch 237
training loss: 0.5475519299507141 

Epoch 3, batch 238
training loss: 0.02709229663014412 

Epoch 3, batch 239
training loss: 0.010693627409636974 

Epoch 3, batch 240
training loss: 0.09937216341495514 

Epoch 3, batch 241
training loss: 0.39725053310394287 

Epoch 3, batch 242
training loss: 0.31649845838546753 

Epoch 3, batch 243
training loss: 0.2842046618461609 

Epoch 3, batch 244
training loss: 0.06121329218149185 

Epoch 3, batch 245
training loss: 0.011523043736815453 

Epoch 3, batch 246
training loss: 0.013887275941669941 

Epoch 3, batch 247
training loss: 0.0134954284876585 

Epoch 3, batch 248
training loss: 0.25926649570

Epoch 3, batch 453
training loss: 0.018555505201220512 

Epoch 3, batch 454
training loss: 0.01807381957769394 

Epoch 3, batch 455
training loss: 0.5599153637886047 

Epoch 3, batch 456
training loss: 0.28650036454200745 

Epoch 3, batch 457
training loss: 0.02279709465801716 

Epoch 3, batch 458
training loss: 0.04869646579027176 

Epoch 3, batch 459
training loss: 0.012381444685161114 

Epoch 3, batch 460
training loss: 0.10614428669214249 

Epoch 3, batch 461
training loss: 0.01725487783551216 

Epoch 3, batch 462
training loss: 0.12745976448059082 

Epoch 3, batch 463
training loss: 0.01622472144663334 

Epoch 3, batch 464
training loss: 0.12624523043632507 

Epoch 3, batch 465
training loss: 0.04135403409600258 

Epoch 3, batch 466
training loss: 0.05356588214635849 

Epoch 3, batch 467
training loss: 0.03539038449525833 

Epoch 3, batch 468
training loss: 0.08538703620433807 

Epoch 3, batch 469
training loss: 0.04802803695201874 

Epoch 3, batch 470
training loss: 0.15131905674

Epoch 3, batch 675
training loss: 0.024109430611133575 

Epoch 3, batch 676
training loss: 0.5893676280975342 

Epoch 3, batch 677
training loss: 0.45974645018577576 

Epoch 3, batch 678
training loss: 0.025910627096891403 

Epoch 3, batch 679
training loss: 0.0899244099855423 

Epoch 3, batch 680
training loss: 0.022329922765493393 

Epoch 3, batch 681
training loss: 0.01749846525490284 

Epoch 3, batch 682
training loss: 0.4902118742465973 

Epoch 3, batch 683
training loss: 0.020512741059064865 

Epoch 3, batch 684
training loss: 0.2519006133079529 

Epoch 3, batch 685
training loss: 0.011607962660491467 

Epoch 3, batch 686
training loss: 0.28586405515670776 

Epoch 3, batch 687
training loss: 0.19743449985980988 

Epoch 3, batch 688
training loss: 0.13955357670783997 

Epoch 3, batch 689
training loss: 0.03313078731298447 

Epoch 3, batch 690
training loss: 0.05035947635769844 

Epoch 3, batch 691
training loss: 0.03191963955760002 

Epoch 3, batch 692
training loss: 0.04643541201

Epoch 3, batch 895
training loss: 0.06510599702596664 

Epoch 3, batch 896
training loss: 0.40410304069519043 

Epoch 3, batch 897
training loss: 0.05792706087231636 

Epoch 3, batch 898
training loss: 0.21465608477592468 

Epoch 3, batch 899
training loss: 0.5707311630249023 

Epoch 3, batch 900
training loss: 0.3160300850868225 

Epoch 3, batch 901
training loss: 0.106087327003479 

Epoch 3, batch 902
training loss: 0.07276086509227753 

Epoch 3, batch 903
training loss: 0.03988618403673172 

Epoch 3, batch 904
training loss: 0.49820083379745483 

Epoch 3, batch 905
training loss: 0.36815688014030457 

Epoch 3, batch 906
training loss: 0.3502650856971741 

Epoch 3, batch 907
training loss: 0.43866509199142456 

Epoch 3, batch 908
training loss: 0.04747123643755913 

Epoch 3, batch 909
training loss: 0.534130871295929 

Epoch 3, batch 910
training loss: 0.1256866604089737 

Epoch 3, batch 911
training loss: 0.0946943387389183 

Epoch 3, batch 912
training loss: 0.03701772168278694 

E

Epoch 3, batch 1115
training loss: 0.37530413269996643 

Epoch 3, batch 1116
training loss: 0.2288050651550293 

Epoch 3, batch 1117
training loss: 0.21762733161449432 

Epoch 3, batch 1118
training loss: 0.7810279130935669 

Epoch 3, batch 1119
training loss: 0.031416263431310654 

Epoch 3, batch 1120
training loss: 0.020013440400362015 

Epoch 3, batch 1121
training loss: 0.04414316266775131 

Epoch 3, batch 1122
training loss: 0.22434337437152863 

Epoch 3, batch 1123
training loss: 0.08419802039861679 

Epoch 3, batch 1124
training loss: 0.14752943813800812 

Epoch 3, batch 1125
training loss: 0.07820219546556473 

Epoch 3, batch 1126
training loss: 0.09700830280780792 

Epoch 3, batch 1127
training loss: 0.4664158821105957 

Epoch 3, batch 1128
training loss: 0.6852832436561584 

Epoch 3, batch 1129
training loss: 0.2796292006969452 

Epoch 3, batch 1130
training loss: 0.4857022762298584 

Epoch 3, batch 1131
training loss: 0.03945528343319893 

Epoch 3, batch 1132
training loss: 

Epoch 3, batch 1337
training loss: 0.15627127885818481 

Epoch 3, batch 1338
training loss: 0.050605423748493195 

Epoch 3, batch 1339
training loss: 0.10200746357440948 

Epoch 3, batch 1340
training loss: 0.19874337315559387 

Epoch 3, batch 1341
training loss: 0.03192267566919327 

Epoch 3, batch 1342
training loss: 0.08972658216953278 

Epoch 3, batch 1343
training loss: 0.1613466441631317 

Epoch 3, batch 1344
training loss: 0.2821972668170929 

Epoch 3, batch 1345
training loss: 0.22562535107135773 

Epoch 3, batch 1346
training loss: 0.029807960614562035 

Epoch 3, batch 1347
training loss: 0.13202473521232605 

Epoch 3, batch 1348
training loss: 0.2763397693634033 

Epoch 3, batch 1349
training loss: 0.12542970478534698 

Epoch 3, batch 1350
training loss: 0.034173525869846344 

Epoch 3, batch 1351
training loss: 0.03401552885770798 

Epoch 3, batch 1352
training loss: 0.1669926941394806 

Epoch 3, batch 1353
training loss: 0.13379092514514923 

Epoch 3, batch 1354
training los

Epoch 3, batch 1555
training loss: 0.6550711393356323 

Epoch 3, batch 1556
training loss: 0.16926155984401703 

Epoch 3, batch 1557
training loss: 0.25160154700279236 

Epoch 3, batch 1558
training loss: 0.02278093993663788 

Epoch 3, batch 1559
training loss: 0.06711842864751816 

Epoch 3, batch 1560
training loss: 0.02815033122897148 

Epoch 3, batch 1561
training loss: 0.10041718184947968 

Epoch 3, batch 1562
training loss: 0.44640859961509705 

Epoch 3, batch 1563
training loss: 0.08773411810398102 

Epoch 3, batch 1564
training loss: 0.02950332500040531 

Epoch 3, batch 1565
training loss: 0.05186524987220764 

Epoch 3, batch 1566
training loss: 0.32914018630981445 

Epoch 3, batch 1567
training loss: 0.6971033811569214 

Epoch 3, batch 1568
training loss: 0.14653585851192474 

Epoch 3, batch 1569
training loss: 0.3295363783836365 

Epoch 3, batch 1570
training loss: 0.21714214980602264 

Epoch 3, batch 1571
training loss: 0.06545288860797882 

Epoch 3, batch 1572
training loss:

Epoch 3, batch 1775
training loss: 0.3032483160495758 

Epoch 3, batch 1776
training loss: 0.06515081226825714 

Epoch 3, batch 1777
training loss: 0.05399644374847412 

Epoch 3, batch 1778
training loss: 0.025398308411240578 

Epoch 3, batch 1779
training loss: 0.14903397858142853 

Epoch 3, batch 1780
training loss: 0.03588181734085083 

Epoch 3, batch 1781
training loss: 0.20150692760944366 

Epoch 3, batch 1782
training loss: 0.35002797842025757 

Epoch 3, batch 1783
training loss: 0.04576686769723892 

Epoch 3, batch 1784
training loss: 0.05914033576846123 

Epoch 3, batch 1785
training loss: 0.39165177941322327 

Epoch 3, batch 1786
training loss: 0.06425200402736664 

Epoch 3, batch 1787
training loss: 0.5859300494194031 

Epoch 3, batch 1788
training loss: 0.1580977886915207 

Epoch 3, batch 1789
training loss: 0.07846944779157639 

Epoch 3, batch 1790
training loss: 0.19314733147621155 

Epoch 3, batch 1791
training loss: 0.042174503207206726 

Epoch 3, batch 1792
training los

Epoch 3, batch 1997
training loss: 0.002896748250350356 

Epoch 3, batch 1998
training loss: 0.6205426454544067 

Epoch 3, batch 1999
training loss: 0.08158250153064728 

Epoch 3, batch 2000
training loss: 0.4917171001434326 

Epoch 3, batch 2001
training loss: 0.17947913706302643 

Epoch 3, batch 2002
training loss: 0.019038796424865723 

Epoch 3, batch 2003
training loss: 0.17997004091739655 

Epoch 3, batch 2004
training loss: 0.08761385828256607 

Epoch 3, batch 2005
training loss: 0.0755033940076828 

Epoch 3, batch 2006
training loss: 0.04301786422729492 

Epoch 3, batch 2007
training loss: 0.027966085821390152 

Epoch 3, batch 2008
training loss: 0.33950740098953247 

Epoch 3, batch 2009
training loss: 0.01864706166088581 

Epoch 3, batch 2010
training loss: 0.2093214988708496 

Epoch 3, batch 2011
training loss: 0.059503357857465744 

Epoch 3, batch 2012
training loss: 0.01046903245151043 

Epoch 3, batch 2013
training loss: 0.26369839906692505 

Epoch 3, batch 2014
training lo

Epoch 3, batch 2218
training loss: 0.32433897256851196 

Epoch 3, batch 2219
training loss: 0.032159071415662766 

Epoch 3, batch 2220
training loss: 0.6780217289924622 

Epoch 3, batch 2221
training loss: 0.3213551938533783 

Epoch 3, batch 2222
training loss: 0.22856497764587402 

Epoch 3, batch 2223
training loss: 0.39718514680862427 

Epoch 3, batch 2224
training loss: 0.03311476483941078 

Epoch 3, batch 2225
training loss: 0.1232815757393837 

Epoch 3, batch 2226
training loss: 0.8704627156257629 

Epoch 3, batch 2227
training loss: 0.020236670970916748 

Epoch 3, batch 2228
training loss: 0.06655152142047882 

Epoch 3, batch 2229
training loss: 0.421968549489975 

Epoch 3, batch 2230
training loss: 0.16921816766262054 

Epoch 3, batch 2231
training loss: 0.08724693208932877 

Epoch 3, batch 2232
training loss: 0.0450839102268219 

Epoch 3, batch 2233
training loss: 0.016335085034370422 

Epoch 3, batch 2234
training loss: 0.3423282206058502 

Epoch 3, batch 2235
training loss: 0

Epoch 3, batch 2438
training loss: 0.816967785358429 

Epoch 3, batch 2439
training loss: 0.05586078017950058 

Epoch 3, batch 2440
training loss: 0.12894302606582642 

Epoch 3, batch 2441
training loss: 0.11624528467655182 

Epoch 3, batch 2442
training loss: 0.14670589566230774 

Epoch 3, batch 2443
training loss: 0.5283023118972778 

Epoch 3, batch 2444
training loss: 0.43543511629104614 

Epoch 3, batch 2445
training loss: 0.09903112053871155 

Epoch 3, batch 2446
training loss: 0.13357946276664734 

Epoch 3, batch 2447
training loss: 0.07278537005186081 

Epoch 3, batch 2448
training loss: 0.058072008192539215 

Epoch 3, batch 2449
training loss: 0.14395079016685486 

Epoch 3, batch 2450
training loss: 0.47430795431137085 

Epoch 3, batch 2451
training loss: 0.17598971724510193 

Epoch 3, batch 2452
training loss: 0.02952813170850277 

Epoch 3, batch 2453
training loss: 0.0518624372780323 

Epoch 3, batch 2454
training loss: 0.06369099766016006 

Epoch 3, batch 2455
training loss:

Epoch 3, batch 2657
training loss: 0.05342607945203781 

Epoch 3, batch 2658
training loss: 0.02427103742957115 

Epoch 3, batch 2659
training loss: 0.6729221940040588 

Epoch 3, batch 2660
training loss: 0.11751637607812881 

Epoch 3, batch 2661
training loss: 0.13072159886360168 

Epoch 3, batch 2662
training loss: 0.27572840452194214 

Epoch 3, batch 2663
training loss: 0.019045110791921616 

Epoch 3, batch 2664
training loss: 0.00453489413484931 

Epoch 3, batch 2665
training loss: 0.15134575963020325 

Epoch 3, batch 2666
training loss: 0.10430234670639038 

Epoch 3, batch 2667
training loss: 0.08317499607801437 

Epoch 3, batch 2668
training loss: 0.4509599804878235 

Epoch 3, batch 2669
training loss: 0.2218053638935089 

Epoch 3, batch 2670
training loss: 0.05260654538869858 

Epoch 3, batch 2671
training loss: 0.021038124337792397 

Epoch 3, batch 2672
training loss: 0.45191091299057007 

Epoch 3, batch 2673
training loss: 0.09348446875810623 

Epoch 3, batch 2674
training los

Epoch 3, batch 2877
training loss: 0.01783783733844757 

Epoch 3, batch 2878
training loss: 0.05911805108189583 

Epoch 3, batch 2879
training loss: 0.5930238962173462 

Epoch 3, batch 2880
training loss: 0.018350113183259964 

Epoch 3, batch 2881
training loss: 0.09340307116508484 

Epoch 3, batch 2882
training loss: 0.15495984256267548 

Epoch 3, batch 2883
training loss: 0.13657133281230927 

Epoch 3, batch 2884
training loss: 0.670921802520752 

Epoch 3, batch 2885
training loss: 0.30129125714302063 

Epoch 3, batch 2886
training loss: 0.10258033126592636 

Epoch 3, batch 2887
training loss: 0.02117440104484558 

Epoch 3, batch 2888
training loss: 0.0890720784664154 

Epoch 3, batch 2889
training loss: 0.09239650517702103 

Epoch 3, batch 2890
training loss: 0.01637295074760914 

Epoch 3, batch 2891
training loss: 0.01857026293873787 

Epoch 3, batch 2892
training loss: 0.059031568467617035 

Epoch 3, batch 2893
training loss: 0.0415458157658577 

Epoch 3, batch 2894
training loss:

Epoch 3, batch 3097
training loss: 0.12576863169670105 

Epoch 3, batch 3098
training loss: 0.021227097138762474 

Epoch 3, batch 3099
training loss: 0.029254794120788574 

Epoch 3, batch 3100
training loss: 0.16572126746177673 

Epoch 3, batch 3101
training loss: 0.060153454542160034 

Epoch 3, batch 3102
training loss: 0.4303286671638489 

Epoch 3, batch 3103
training loss: 0.12007305771112442 

Epoch 3, batch 3104
training loss: 0.06521696597337723 

Epoch 3, batch 3105
training loss: 0.0959850400686264 

Epoch 3, batch 3106
training loss: 0.6606600284576416 

Epoch 3, batch 3107
training loss: 0.17558200657367706 

Epoch 3, batch 3108
training loss: 0.2530108690261841 

Epoch 3, batch 3109
training loss: 0.8135404586791992 

Epoch 3, batch 3110
training loss: 0.4817030429840088 

Epoch 3, batch 3111
training loss: 0.3167794942855835 

Epoch 3, batch 3112
training loss: 0.25993433594703674 

Epoch 3, batch 3113
training loss: 0.2168445587158203 

Epoch 3, batch 3114
training loss: 0

Epoch 3, batch 3316
training loss: 0.3405351936817169 

Epoch 3, batch 3317
training loss: 0.46189722418785095 

Epoch 3, batch 3318
training loss: 0.005427761934697628 

Epoch 3, batch 3319
training loss: 0.35470983386039734 

Epoch 3, batch 3320
training loss: 0.031705327332019806 

Epoch 3, batch 3321
training loss: 0.052951324731111526 

Epoch 3, batch 3322
training loss: 0.49984899163246155 

Epoch 3, batch 3323
training loss: 0.04323650151491165 

Epoch 3, batch 3324
training loss: 0.21291372179985046 

Epoch 3, batch 3325
training loss: 0.2835313677787781 

Epoch 3, batch 3326
training loss: 0.1597343385219574 

Epoch 3, batch 3327
training loss: 0.4226454198360443 

Epoch 3, batch 3328
training loss: 0.24398323893547058 

Epoch 3, batch 3329
training loss: 0.06038457900285721 

Epoch 3, batch 3330
training loss: 0.03877144306898117 

Epoch 3, batch 3331
training loss: 0.06420187652111053 

Epoch 3, batch 3332
training loss: 0.034455664455890656 

Epoch 3, batch 3333
training lo

Epoch 3, batch 3525
training loss: 0.07246632874011993 

Epoch 3, batch 3526
training loss: 0.22735169529914856 

Epoch 3, batch 3527
training loss: 0.17508378624916077 

Epoch 3, batch 3528
training loss: 0.4688642621040344 

Epoch 3, batch 3529
training loss: 0.028075847774744034 

Epoch 3, batch 3530
training loss: 0.046111203730106354 

Epoch 3, batch 3531
training loss: 0.07421956956386566 

Epoch 3, batch 3532
training loss: 0.03361845761537552 

Epoch 3, batch 3533
training loss: 0.3030390739440918 

Epoch 3, batch 3534
training loss: 0.05386177450418472 

Epoch 3, batch 3535
training loss: 0.019098440185189247 

Epoch 3, batch 3536
training loss: 0.1708400398492813 

Epoch 3, batch 3537
training loss: 0.8255205154418945 

Epoch 3, batch 3538
training loss: 0.5602108836174011 

Epoch 3, batch 3539
training loss: 0.18732942640781403 

Epoch 3, batch 3540
training loss: 0.1791185438632965 

Epoch 3, batch 3541
training loss: 0.1503462940454483 

Epoch 3, batch 3542
training loss: 

Epoch 3, batch 3743
training loss: 0.01976367086172104 

Epoch 3, batch 3744
training loss: 0.17828945815563202 

Epoch 3, batch 3745
training loss: 0.03192504122853279 

Epoch 3, batch 3746
training loss: 0.21186241507530212 

Epoch 3, batch 3747
training loss: 0.24358269572257996 

Epoch 3, batch 3748
training loss: 0.08655554801225662 

Epoch 3, batch 3749
training loss: 0.03440055251121521 

Epoch 3, batch 3750
training loss: 0.09871445596218109 

Epoch 3, batch 3751
training loss: 0.07823602855205536 

Epoch 3, batch 3752
training loss: 0.13253386318683624 

Epoch 3, batch 3753
training loss: 0.2051355540752411 

Epoch 3, batch 3754
training loss: 0.23846681416034698 

Epoch 3, batch 3755
training loss: 0.05963829904794693 

Epoch 3, batch 3756
training loss: 0.37851953506469727 

Epoch 3, batch 3757
training loss: 0.3205329477787018 

Epoch 3, batch 3758
training loss: 0.037897031754255295 

Epoch 3, batch 3759
training loss: 0.6804220080375671 

Epoch 3, batch 3760
training loss

Epoch 3, batch 3964
training loss: 0.177285835146904 

Epoch 3, batch 3965
training loss: 0.0829923078417778 

Epoch 3, batch 3966
training loss: 0.03521091118454933 

Epoch 3, batch 3967
training loss: 0.07457397133111954 

Epoch 3, batch 3968
training loss: 0.019562777131795883 

Epoch 3, batch 3969
training loss: 0.21980056166648865 

Epoch 3, batch 3970
training loss: 0.0908902958035469 

Epoch 3, batch 3971
training loss: 0.013340210542082787 

Epoch 3, batch 3972
training loss: 0.43014830350875854 

Epoch 3, batch 3973
training loss: 0.2149374932050705 

Epoch 3, batch 3974
training loss: 1.1625772714614868 

Epoch 3, batch 3975
training loss: 0.23127086460590363 

Epoch 3, batch 3976
training loss: 0.19408217072486877 

Epoch 3, batch 3977
training loss: 0.06433123350143433 

Epoch 3, batch 3978
training loss: 0.08719411492347717 

Epoch 3, batch 3979
training loss: 0.06040434166789055 

Epoch 3, batch 3980
training loss: 0.06327708065509796 

Epoch 3, batch 3981
training loss: 

Epoch 3, batch 4182
training loss: 0.03156162053346634 

Epoch 3, batch 4183
training loss: 0.2633756399154663 

Epoch 3, batch 4184
training loss: 0.039244744926691055 

Epoch 3, batch 4185
training loss: 0.028210824355483055 

Epoch 3, batch 4186
training loss: 0.04148141294717789 

Epoch 3, batch 4187
training loss: 0.06283892691135406 

Epoch 3, batch 4188
training loss: 0.017554255202412605 

Epoch 3, batch 4189
training loss: 0.08803451061248779 

Epoch 3, batch 4190
training loss: 0.12682773172855377 

Epoch 3, batch 4191
training loss: 0.042223744094371796 

Epoch 3, batch 4192
training loss: 0.6855464577674866 

Epoch 3, batch 4193
training loss: 0.05816352367401123 

Epoch 3, batch 4194
training loss: 0.25640934705734253 

Epoch 3, batch 4195
training loss: 0.04690282419323921 

Epoch 3, batch 4196
training loss: 0.392882764339447 

Epoch 3, batch 4197
training loss: 0.2406189888715744 

Epoch 3, batch 4198
training loss: 0.015971021726727486 

Epoch 3, batch 4199
training lo

Epoch 3, batch 4403
training loss: 0.022625554352998734 

Epoch 3, batch 4404
training loss: 0.036089859902858734 

Epoch 3, batch 4405
training loss: 0.032705873250961304 

Epoch 3, batch 4406
training loss: 0.06429274380207062 

Epoch 3, batch 4407
training loss: 0.02921069785952568 

Epoch 3, batch 4408
training loss: 0.01399158500134945 

Epoch 3, batch 4409
training loss: 0.953726589679718 

Epoch 3, batch 4410
training loss: 0.054673321545124054 

Epoch 3, batch 4411
training loss: 0.1272224485874176 

Epoch 3, batch 4412
training loss: 0.05099957063794136 

Epoch 3, batch 4413
training loss: 0.3537622094154358 

Epoch 3, batch 4414
training loss: 0.03627089411020279 

Epoch 3, batch 4415
training loss: 0.3807779550552368 

Epoch 3, batch 4416
training loss: 0.05929701402783394 

Epoch 3, batch 4417
training loss: 0.19950224459171295 

Epoch 3, batch 4418
training loss: 0.1396777182817459 

Epoch 3, batch 4419
training loss: 0.22171270847320557 

Epoch 3, batch 4420
training loss

Epoch 3, batch 4622
training loss: 0.13636189699172974 

Epoch 3, batch 4623
training loss: 0.141172856092453 

Epoch 3, batch 4624
training loss: 0.5325404405593872 

Epoch 3, batch 4625
training loss: 0.036465760320425034 

Epoch 3, batch 4626
training loss: 0.11054684221744537 

Epoch 3, batch 4627
training loss: 0.2657245993614197 

Epoch 3, batch 4628
training loss: 0.042166613042354584 

Epoch 3, batch 4629
training loss: 0.14821207523345947 

Epoch 3, batch 4630
training loss: 0.0050343540497124195 

Epoch 3, batch 4631
training loss: 0.17052032053470612 

Epoch 3, batch 4632
training loss: 0.023017358034849167 

Epoch 3, batch 4633
training loss: 0.3729941248893738 

Epoch 3, batch 4634
training loss: 0.007374942302703857 

Epoch 3, batch 4635
training loss: 0.11744558811187744 

Epoch 3, batch 4636
training loss: 0.07500061392784119 

Epoch 3, batch 4637
training loss: 0.5458826422691345 

Epoch 3, batch 4638
training loss: 0.04769916087388992 

Epoch 3, batch 4639
training lo

Epoch 3, batch 4842
training loss: 0.03258369863033295 

Epoch 3, batch 4843
training loss: 0.04284996539354324 

Epoch 3, batch 4844
training loss: 0.007524422369897366 

Epoch 3, batch 4845
training loss: 0.35248076915740967 

Epoch 3, batch 4846
training loss: 0.128096342086792 

Epoch 3, batch 4847
training loss: 0.027361053973436356 

Epoch 3, batch 4848
training loss: 0.23563134670257568 

Epoch 3, batch 4849
training loss: 0.03184017539024353 

Epoch 3, batch 4850
training loss: 0.21533603966236115 

Epoch 3, batch 4851
training loss: 0.6403931975364685 

Epoch 3, batch 4852
training loss: 0.6525155305862427 

Epoch 3, batch 4853
training loss: 0.05563708022236824 

Epoch 3, batch 4854
training loss: 0.12525217235088348 

Epoch 3, batch 4855
training loss: 0.023380925878882408 

Epoch 3, batch 4856
training loss: 0.16414494812488556 

Epoch 3, batch 4857
training loss: 0.21576865017414093 

Epoch 3, batch 4858
training loss: 0.11543893814086914 

Epoch 3, batch 4859
training los

Epoch 3, batch 5059
training loss: 0.045605435967445374 

Epoch 3, batch 5060
training loss: 0.21389400959014893 

Epoch 3, batch 5061
training loss: 0.315011590719223 

Epoch 3, batch 5062
training loss: 0.15105821192264557 

Epoch 3, batch 5063
training loss: 0.1439667046070099 

Epoch 3, batch 5064
training loss: 0.08110561221837997 

Epoch 3, batch 5065
training loss: 0.026777803897857666 

Epoch 3, batch 5066
training loss: 0.10679014772176743 

Epoch 3, batch 5067
training loss: 0.05849070101976395 

Epoch 3, batch 5068
training loss: 0.06460113823413849 

Epoch 3, batch 5069
training loss: 0.024144960567355156 

Epoch 3, batch 5070
training loss: 0.21750564873218536 

Epoch 3, batch 5071
training loss: 0.16869229078292847 

Epoch 3, batch 5072
training loss: 0.4665514826774597 

Epoch 3, batch 5073
training loss: 0.2448839694261551 

Epoch 3, batch 5074
training loss: 0.05881152302026749 

Epoch 3, batch 5075
training loss: 0.07224705070257187 

Epoch 3, batch 5076
training loss

Epoch 3, batch 5280
training loss: 0.03092266619205475 

Epoch 3, batch 5281
training loss: 0.03603474050760269 

Epoch 3, batch 5282
training loss: 0.08995570987462997 

Epoch 3, batch 5283
training loss: 0.12459572404623032 

Epoch 3, batch 5284
training loss: 0.12770068645477295 

Epoch 3, batch 5285
training loss: 0.2981816530227661 

Epoch 3, batch 5286
training loss: 0.020606093108654022 

Epoch 3, batch 5287
training loss: 0.4867455065250397 

Epoch 3, batch 5288
training loss: 0.017367828637361526 

Epoch 3, batch 5289
training loss: 1.111799955368042 

Epoch 3, batch 5290
training loss: 0.06656866520643234 

Epoch 3, batch 5291
training loss: 0.02464994788169861 

Epoch 3, batch 5292
training loss: 0.2363366186618805 

Epoch 3, batch 5293
training loss: 0.07786017656326294 

Epoch 3, batch 5294
training loss: 0.7655535936355591 

Epoch 3, batch 5295
training loss: 0.845032811164856 

Epoch 3, batch 5296
training loss: 0.06074760481715202 

Epoch 3, batch 5297
training loss: 0.

Epoch 3, batch 5500
training loss: 0.05742419511079788 

Epoch 3, batch 5501
training loss: 0.44254398345947266 

Epoch 3, batch 5502
training loss: 0.032620497047901154 

Epoch 3, batch 5503
training loss: 0.02561408281326294 

Epoch 3, batch 5504
training loss: 0.03191498667001724 

Epoch 3, batch 5505
training loss: 0.010281691327691078 

Epoch 3, batch 5506
training loss: 0.10177335888147354 

Epoch 3, batch 5507
training loss: 0.2094448059797287 

Epoch 3, batch 5508
training loss: 0.24841658771038055 

Epoch 3, batch 5509
training loss: 0.0057191429659724236 

Epoch 3, batch 5510
training loss: 0.1835743635892868 

Epoch 3, batch 5511
training loss: 0.42774567008018494 

Epoch 3, batch 5512
training loss: 0.026860404759645462 

Epoch 3, batch 5513
training loss: 0.07670088112354279 

Epoch 3, batch 5514
training loss: 0.14181171357631683 

Epoch 3, batch 5515
training loss: 0.06422089040279388 

Epoch 3, batch 5516
training loss: 0.05887002870440483 

Epoch 3, batch 5517
training

Epoch 3, batch 5719
training loss: 0.19663576781749725 

Epoch 3, batch 5720
training loss: 0.02590683475136757 

Epoch 3, batch 5721
training loss: 0.13699375092983246 

Epoch 3, batch 5722
training loss: 0.30793648958206177 

Epoch 3, batch 5723
training loss: 0.6130173206329346 

Epoch 3, batch 5724
training loss: 0.1210876926779747 

Epoch 3, batch 5725
training loss: 0.17954310774803162 

Epoch 3, batch 5726
training loss: 0.04374447092413902 

Epoch 3, batch 5727
training loss: 0.28675201535224915 

Epoch 3, batch 5728
training loss: 0.15884904563426971 

Epoch 3, batch 5729
training loss: 0.12442304193973541 

Epoch 3, batch 5730
training loss: 0.12026266753673553 

Epoch 3, batch 5731
training loss: 0.04986304044723511 

Epoch 3, batch 5732
training loss: 0.01465222705155611 

Epoch 3, batch 5733
training loss: 0.022304194048047066 

Epoch 3, batch 5734
training loss: 0.20771372318267822 

Epoch 3, batch 5735
training loss: 0.016224171966314316 

Epoch 3, batch 5736
training lo

Epoch 3, batch 5937
training loss: 0.04686595872044563 

Epoch 3, batch 5938
training loss: 0.9356557726860046 

Epoch 3, batch 5939
training loss: 0.03492344543337822 

Epoch 3, batch 5940
training loss: 0.03346091881394386 

Epoch 3, batch 5941
training loss: 0.058601271361112595 

Epoch 3, batch 5942
training loss: 0.053767211735248566 

Epoch 3, batch 5943
training loss: 0.2757716774940491 

Epoch 3, batch 5944
training loss: 0.3921878933906555 

Epoch 3, batch 5945
training loss: 0.07561679184436798 

Epoch 3, batch 5946
training loss: 0.04957369714975357 

Epoch 3, batch 5947
training loss: 0.32622653245925903 

Epoch 3, batch 5948
training loss: 0.058056991547346115 

Epoch 3, batch 5949
training loss: 0.07826925814151764 

Epoch 3, batch 5950
training loss: 0.1692320704460144 

Epoch 3, batch 5951
training loss: 0.15606406331062317 

Epoch 3, batch 5952
training loss: 0.544265627861023 

Epoch 3, batch 5953
training loss: 0.1592879593372345 

Epoch 3, batch 5954
training loss: 

Epoch 4, batch 156
training loss: 0.4957723617553711 

Epoch 4, batch 157
training loss: 0.017824232578277588 

Epoch 4, batch 158
training loss: 0.6520741581916809 

Epoch 4, batch 159
training loss: 0.14951249957084656 

Epoch 4, batch 160
training loss: 0.015137051232159138 

Epoch 4, batch 161
training loss: 0.03617999330163002 

Epoch 4, batch 162
training loss: 0.14725002646446228 

Epoch 4, batch 163
training loss: 0.010660948231816292 

Epoch 4, batch 164
training loss: 0.029615525156259537 

Epoch 4, batch 165
training loss: 0.010852278210222721 

Epoch 4, batch 166
training loss: 0.24316847324371338 

Epoch 4, batch 167
training loss: 0.03789243847131729 

Epoch 4, batch 168
training loss: 0.20076008141040802 

Epoch 4, batch 169
training loss: 0.05286659672856331 

Epoch 4, batch 170
training loss: 0.10135481506586075 

Epoch 4, batch 171
training loss: 0.40172338485717773 

Epoch 4, batch 172
training loss: 0.0384812206029892 

Epoch 4, batch 173
training loss: 0.1546785384

Epoch 4, batch 374
training loss: 0.08023635298013687 

Epoch 4, batch 375
training loss: 0.01811978593468666 

Epoch 4, batch 376
training loss: 0.02967245504260063 

Epoch 4, batch 377
training loss: 0.5604936480522156 

Epoch 4, batch 378
training loss: 0.03230654075741768 

Epoch 4, batch 379
training loss: 0.007752536796033382 

Epoch 4, batch 380
training loss: 0.7975174188613892 

Epoch 4, batch 381
training loss: 0.19107124209403992 

Epoch 4, batch 382
training loss: 0.0507163405418396 

Epoch 4, batch 383
training loss: 0.06694764643907547 

Epoch 4, batch 384
training loss: 0.04860955476760864 

Epoch 4, batch 385
training loss: 0.009785900823771954 

Epoch 4, batch 386
training loss: 0.029460543766617775 

Epoch 4, batch 387
training loss: 0.16335023939609528 

Epoch 4, batch 388
training loss: 0.10705627501010895 

Epoch 4, batch 389
training loss: 0.4742915630340576 

Epoch 4, batch 390
training loss: 0.07035424560308456 

Epoch 4, batch 391
training loss: 0.0820021107792

Epoch 4, batch 597
training loss: 0.32833123207092285 

Epoch 4, batch 598
training loss: 0.40751904249191284 

Epoch 4, batch 599
training loss: 0.2506575286388397 

Epoch 4, batch 600
training loss: 0.027881577610969543 

Epoch 4, batch 601
training loss: 0.031716279685497284 

Epoch 4, batch 602
training loss: 0.043341536074876785 

Epoch 4, batch 603
training loss: 0.06350351125001907 

Epoch 4, batch 604
training loss: 0.12330667674541473 

Epoch 4, batch 605
training loss: 0.4186210632324219 

Epoch 4, batch 606
training loss: 0.021880879998207092 

Epoch 4, batch 607
training loss: 0.12928423285484314 

Epoch 4, batch 608
training loss: 0.12166569381952286 

Epoch 4, batch 609
training loss: 0.05396503955125809 

Epoch 4, batch 610
training loss: 0.3282548189163208 

Epoch 4, batch 611
training loss: 0.03502896428108215 

Epoch 4, batch 612
training loss: 0.10318179428577423 

Epoch 4, batch 613
training loss: 0.014937961474061012 

Epoch 4, batch 614
training loss: 0.0150263309

Epoch 4, batch 807
training loss: 0.14707812666893005 

Epoch 4, batch 808
training loss: 0.17019997537136078 

Epoch 4, batch 809
training loss: 0.04549117758870125 

Epoch 4, batch 810
training loss: 0.05528447777032852 

Epoch 4, batch 811
training loss: 0.10827501118183136 

Epoch 4, batch 812
training loss: 0.13398750126361847 

Epoch 4, batch 813
training loss: 0.02160242199897766 

Epoch 4, batch 814
training loss: 0.22167429327964783 

Epoch 4, batch 815
training loss: 0.0863208994269371 

Epoch 4, batch 816
training loss: 0.03690505772829056 

Epoch 4, batch 817
training loss: 0.08642291277647018 

Epoch 4, batch 818
training loss: 0.07651541382074356 

Epoch 4, batch 819
training loss: 0.11657704412937164 

Epoch 4, batch 820
training loss: 0.09368220716714859 

Epoch 4, batch 821
training loss: 0.11985693871974945 

Epoch 4, batch 822
training loss: 0.08668819814920425 

Epoch 4, batch 823
training loss: 0.13046132028102875 

Epoch 4, batch 824
training loss: 0.4192016720771

Epoch 4, batch 1027
training loss: 0.8097079992294312 

Epoch 4, batch 1028
training loss: 0.5233251452445984 

Epoch 4, batch 1029
training loss: 0.14866900444030762 

Epoch 4, batch 1030
training loss: 0.15801799297332764 

Epoch 4, batch 1031
training loss: 0.08193107694387436 

Epoch 4, batch 1032
training loss: 0.04599873721599579 

Epoch 4, batch 1033
training loss: 0.21303315460681915 

Epoch 4, batch 1034
training loss: 0.07270356267690659 

Epoch 4, batch 1035
training loss: 0.05864715576171875 

Epoch 4, batch 1036
training loss: 0.013881039805710316 

Epoch 4, batch 1037
training loss: 0.055617280304431915 

Epoch 4, batch 1038
training loss: 0.18726593255996704 

Epoch 4, batch 1039
training loss: 0.37773871421813965 

Epoch 4, batch 1040
training loss: 0.2614399194717407 

Epoch 4, batch 1041
training loss: 0.3425470292568207 

Epoch 4, batch 1042
training loss: 0.5795533657073975 

Epoch 4, batch 1043
training loss: 0.28543344140052795 

Epoch 4, batch 1044
training loss:

Epoch 4, batch 1248
training loss: 0.17139381170272827 

Epoch 4, batch 1249
training loss: 0.0324350968003273 

Epoch 4, batch 1250
training loss: 0.052787117660045624 

Epoch 4, batch 1251
training loss: 0.08040808141231537 

Epoch 4, batch 1252
training loss: 0.03745698183774948 

Epoch 4, batch 1253
training loss: 0.010832260362803936 

Epoch 4, batch 1254
training loss: 0.07982484251260757 

Epoch 4, batch 1255
training loss: 0.14371129870414734 

Epoch 4, batch 1256
training loss: 0.0170952957123518 

Epoch 4, batch 1257
training loss: 0.2737250030040741 

Epoch 4, batch 1258
training loss: 0.24023787677288055 

Epoch 4, batch 1259
training loss: 0.059125445783138275 

Epoch 4, batch 1260
training loss: 0.5894569158554077 

Epoch 4, batch 1261
training loss: 0.034683145582675934 

Epoch 4, batch 1262
training loss: 0.24357476830482483 

Epoch 4, batch 1263
training loss: 0.547435998916626 

Epoch 4, batch 1264
training loss: 0.1543288230895996 

Epoch 4, batch 1265
training loss:

Epoch 4, batch 1472
training loss: 0.2140442430973053 

Epoch 4, batch 1473
training loss: 1.0085229873657227 

Epoch 4, batch 1474
training loss: 0.053802281618118286 

Epoch 4, batch 1475
training loss: 0.05354652926325798 

Epoch 4, batch 1476
training loss: 0.06740546971559525 

Epoch 4, batch 1477
training loss: 0.18978312611579895 

Epoch 4, batch 1478
training loss: 0.043929751962423325 

Epoch 4, batch 1479
training loss: 0.20920486748218536 

Epoch 4, batch 1480
training loss: 0.16431334614753723 

Epoch 4, batch 1481
training loss: 0.07389119267463684 

Epoch 4, batch 1482
training loss: 0.06596283614635468 

Epoch 4, batch 1483
training loss: 0.2166684865951538 

Epoch 4, batch 1484
training loss: 0.010893210768699646 

Epoch 4, batch 1485
training loss: 0.056660234928131104 

Epoch 4, batch 1486
training loss: 0.016073353588581085 

Epoch 4, batch 1487
training loss: 0.06087968498468399 

Epoch 4, batch 1488
training loss: 0.11316323280334473 

Epoch 4, batch 1489
training 

Epoch 4, batch 1697
training loss: 0.31246083974838257 

Epoch 4, batch 1698
training loss: 0.03632970526814461 

Epoch 4, batch 1699
training loss: 0.017717858776450157 

Epoch 4, batch 1700
training loss: 0.037983424961566925 

Epoch 4, batch 1701
training loss: 0.0070438506081700325 

Epoch 4, batch 1702
training loss: 0.6533992886543274 

Epoch 4, batch 1703
training loss: 0.19653582572937012 

Epoch 4, batch 1704
training loss: 0.17794939875602722 

Epoch 4, batch 1705
training loss: 0.01144125871360302 

Epoch 4, batch 1706
training loss: 0.026052573695778847 

Epoch 4, batch 1707
training loss: 0.1513313502073288 

Epoch 4, batch 1708
training loss: 0.03191182389855385 

Epoch 4, batch 1709
training loss: 0.01619010977447033 

Epoch 4, batch 1710
training loss: 0.004936349578201771 

Epoch 4, batch 1711
training loss: 0.03796330839395523 

Epoch 4, batch 1712
training loss: 0.1306629329919815 

Epoch 4, batch 1713
training loss: 0.02627052739262581 

Epoch 4, batch 1714
training

Epoch 4, batch 1917
training loss: 0.03894985839724541 

Epoch 4, batch 1918
training loss: 0.055626802146434784 

Epoch 4, batch 1919
training loss: 0.09061212837696075 

Epoch 4, batch 1920
training loss: 0.033215202391147614 

Epoch 4, batch 1921
training loss: 0.12374355643987656 

Epoch 4, batch 1922
training loss: 0.5371311902999878 

Epoch 4, batch 1923
training loss: 0.15386167168617249 

Epoch 4, batch 1924
training loss: 0.03495163470506668 

Epoch 4, batch 1925
training loss: 0.23592522740364075 

Epoch 4, batch 1926
training loss: 0.21281051635742188 

Epoch 4, batch 1927
training loss: 0.05093952268362045 

Epoch 4, batch 1928
training loss: 0.1262802928686142 

Epoch 4, batch 1929
training loss: 0.6828180551528931 

Epoch 4, batch 1930
training loss: 0.05473928898572922 

Epoch 4, batch 1931
training loss: 0.0198187418282032 

Epoch 4, batch 1932
training loss: 0.04019778594374657 

Epoch 4, batch 1933
training loss: 0.12350283563137054 

Epoch 4, batch 1934
training loss

Epoch 4, batch 2136
training loss: 0.016613880172371864 

Epoch 4, batch 2137
training loss: 0.01613888517022133 

Epoch 4, batch 2138
training loss: 0.02138364687561989 

Epoch 4, batch 2139
training loss: 0.6644686460494995 

Epoch 4, batch 2140
training loss: 0.7604820132255554 

Epoch 4, batch 2141
training loss: 0.10172271728515625 

Epoch 4, batch 2142
training loss: 0.4651072919368744 

Epoch 4, batch 2143
training loss: 0.1366003453731537 

Epoch 4, batch 2144
training loss: 0.2019536793231964 

Epoch 4, batch 2145
training loss: 0.026267260313034058 

Epoch 4, batch 2146
training loss: 0.022145768627524376 

Epoch 4, batch 2147
training loss: 0.01534174382686615 

Epoch 4, batch 2148
training loss: 0.084461510181427 

Epoch 4, batch 2149
training loss: 0.021616151556372643 

Epoch 4, batch 2150
training loss: 0.1444028615951538 

Epoch 4, batch 2151
training loss: 0.00957961194217205 

Epoch 4, batch 2152
training loss: 0.072951540350914 

Epoch 4, batch 2153
training loss: 0.

Epoch 4, batch 2356
training loss: 0.016537128016352654 

Epoch 4, batch 2357
training loss: 0.18255874514579773 

Epoch 4, batch 2358
training loss: 0.05073262378573418 

Epoch 4, batch 2359
training loss: 0.11089762300252914 

Epoch 4, batch 2360
training loss: 0.2852134108543396 

Epoch 4, batch 2361
training loss: 0.13859161734580994 

Epoch 4, batch 2362
training loss: 0.019830254837870598 

Epoch 4, batch 2363
training loss: 0.012919045984745026 

Epoch 4, batch 2364
training loss: 0.1367601901292801 

Epoch 4, batch 2365
training loss: 0.2880610525608063 

Epoch 4, batch 2366
training loss: 0.05071006342768669 

Epoch 4, batch 2367
training loss: 0.03354645520448685 

Epoch 4, batch 2368
training loss: 0.008058019913733006 

Epoch 4, batch 2369
training loss: 0.23031501471996307 

Epoch 4, batch 2370
training loss: 0.24254123866558075 

Epoch 4, batch 2371
training loss: 0.32986751198768616 

Epoch 4, batch 2372
training loss: 0.039984505623579025 

Epoch 4, batch 2373
training 

Epoch 4, batch 2576
training loss: 0.14424759149551392 

Epoch 4, batch 2577
training loss: 0.041393350809812546 

Epoch 4, batch 2578
training loss: 0.018171558156609535 

Epoch 4, batch 2579
training loss: 0.087196484208107 

Epoch 4, batch 2580
training loss: 0.1405375450849533 

Epoch 4, batch 2581
training loss: 0.3528205156326294 

Epoch 4, batch 2582
training loss: 0.025657331570982933 

Epoch 4, batch 2583
training loss: 0.14632157981395721 

Epoch 4, batch 2584
training loss: 0.3623276352882385 

Epoch 4, batch 2585
training loss: 0.04661677032709122 

Epoch 4, batch 2586
training loss: 0.5752245187759399 

Epoch 4, batch 2587
training loss: 0.18107564747333527 

Epoch 4, batch 2588
training loss: 0.14649170637130737 

Epoch 4, batch 2589
training loss: 0.06569238752126694 

Epoch 4, batch 2590
training loss: 0.011176234111189842 

Epoch 4, batch 2591
training loss: 0.4243531823158264 

Epoch 4, batch 2592
training loss: 0.09600064158439636 

Epoch 4, batch 2593
training loss:

Epoch 4, batch 2800
training loss: 0.08566038310527802 

Epoch 4, batch 2801
training loss: 0.18561533093452454 

Epoch 4, batch 2802
training loss: 0.26182684302330017 

Epoch 4, batch 2803
training loss: 0.3001016080379486 

Epoch 4, batch 2804
training loss: 0.15474066138267517 

Epoch 4, batch 2805
training loss: 0.08142885565757751 

Epoch 4, batch 2806
training loss: 0.01582159474492073 

Epoch 4, batch 2807
training loss: 0.06856479495763779 

Epoch 4, batch 2808
training loss: 0.03149533271789551 

Epoch 4, batch 2809
training loss: 0.014717255719006062 

Epoch 4, batch 2810
training loss: 0.21992966532707214 

Epoch 4, batch 2811
training loss: 0.16277548670768738 

Epoch 4, batch 2812
training loss: 0.21280093491077423 

Epoch 4, batch 2813
training loss: 0.1492433249950409 

Epoch 4, batch 2814
training loss: 0.08380717784166336 

Epoch 4, batch 2815
training loss: 0.08891858160495758 

Epoch 4, batch 2816
training loss: 0.13855120539665222 

Epoch 4, batch 2817
training los

Epoch 4, batch 3023
training loss: 0.09261347353458405 

Epoch 4, batch 3024
training loss: 0.18427987396717072 

Epoch 4, batch 3025
training loss: 0.2638075351715088 

Epoch 4, batch 3026
training loss: 0.24730035662651062 

Epoch 4, batch 3027
training loss: 0.01867573708295822 

Epoch 4, batch 3028
training loss: 0.14593765139579773 

Epoch 4, batch 3029
training loss: 0.2708870470523834 

Epoch 4, batch 3030
training loss: 0.7856653332710266 

Epoch 4, batch 3031
training loss: 0.24298980832099915 

Epoch 4, batch 3032
training loss: 0.07113038003444672 

Epoch 4, batch 3033
training loss: 0.027096593752503395 

Epoch 4, batch 3034
training loss: 0.07998868823051453 

Epoch 4, batch 3035
training loss: 0.12524230778217316 

Epoch 4, batch 3036
training loss: 0.05945010110735893 

Epoch 4, batch 3037
training loss: 0.36746904253959656 

Epoch 4, batch 3038
training loss: 0.042759209871292114 

Epoch 4, batch 3039
training loss: 0.017961731180548668 

Epoch 4, batch 3040
training lo

Epoch 4, batch 3247
training loss: 0.06025588512420654 

Epoch 4, batch 3248
training loss: 0.017059355974197388 

Epoch 4, batch 3249
training loss: 0.06245095655322075 

Epoch 4, batch 3250
training loss: 0.14409376680850983 

Epoch 4, batch 3251
training loss: 0.19513951241970062 

Epoch 4, batch 3252
training loss: 0.406804621219635 

Epoch 4, batch 3253
training loss: 0.033642031252384186 

Epoch 4, batch 3254
training loss: 0.009889434091746807 

Epoch 4, batch 3255
training loss: 0.2691982090473175 

Epoch 4, batch 3256
training loss: 0.32153135538101196 

Epoch 4, batch 3257
training loss: 0.009786738082766533 

Epoch 4, batch 3258
training loss: 0.016937704756855965 

Epoch 4, batch 3259
training loss: 0.06434524059295654 

Epoch 4, batch 3260
training loss: 0.1672348529100418 

Epoch 4, batch 3261
training loss: 0.010353521443903446 

Epoch 4, batch 3262
training loss: 0.04438347741961479 

Epoch 4, batch 3263
training loss: 0.9313844442367554 

Epoch 4, batch 3264
training l

Epoch 4, batch 3469
training loss: 0.11503980308771133 

Epoch 4, batch 3470
training loss: 0.01245728600770235 

Epoch 4, batch 3471
training loss: 0.0604739785194397 

Epoch 4, batch 3472
training loss: 0.4277578890323639 

Epoch 4, batch 3473
training loss: 0.05937749147415161 

Epoch 4, batch 3474
training loss: 0.03511740267276764 

Epoch 4, batch 3475
training loss: 0.09279230982065201 

Epoch 4, batch 3476
training loss: 0.12918610870838165 

Epoch 4, batch 3477
training loss: 0.05470218509435654 

Epoch 4, batch 3478
training loss: 0.3264584243297577 

Epoch 4, batch 3479
training loss: 0.0454239621758461 

Epoch 4, batch 3480
training loss: 0.07875533401966095 

Epoch 4, batch 3481
training loss: 0.020653286948800087 

Epoch 4, batch 3482
training loss: 0.053157828748226166 

Epoch 4, batch 3483
training loss: 0.3378513753414154 

Epoch 4, batch 3484
training loss: 0.04786597937345505 

Epoch 4, batch 3485
training loss: 0.09084561467170715 

Epoch 4, batch 3486
training loss:

Epoch 4, batch 3692
training loss: 0.22139999270439148 

Epoch 4, batch 3693
training loss: 0.09641730785369873 

Epoch 4, batch 3694
training loss: 0.06894655525684357 

Epoch 4, batch 3695
training loss: 0.0319661870598793 

Epoch 4, batch 3696
training loss: 0.0866641104221344 

Epoch 4, batch 3697
training loss: 0.054725296795368195 

Epoch 4, batch 3698
training loss: 0.035599447786808014 

Epoch 4, batch 3699
training loss: 0.09789595752954483 

Epoch 4, batch 3700
training loss: 0.09212910383939743 

Epoch 4, batch 3701
training loss: 0.22769984602928162 

Epoch 4, batch 3702
training loss: 0.08867456018924713 

Epoch 4, batch 3703
training loss: 0.0672089084982872 

Epoch 4, batch 3704
training loss: 0.06974363327026367 

Epoch 4, batch 3705
training loss: 0.10504118353128433 

Epoch 4, batch 3706
training loss: 0.004787108860909939 

Epoch 4, batch 3707
training loss: 0.05722472071647644 

Epoch 4, batch 3708
training loss: 0.014374935999512672 

Epoch 4, batch 3709
training l

Epoch 4, batch 3915
training loss: 0.01698506809771061 

Epoch 4, batch 3916
training loss: 0.6603444814682007 

Epoch 4, batch 3917
training loss: 0.0923721119761467 

Epoch 4, batch 3918
training loss: 0.004941781051456928 

Epoch 4, batch 3919
training loss: 0.1769382357597351 

Epoch 4, batch 3920
training loss: 0.2811369001865387 

Epoch 4, batch 3921
training loss: 0.1005302220582962 

Epoch 4, batch 3922
training loss: 0.14390720427036285 

Epoch 4, batch 3923
training loss: 0.21051199734210968 

Epoch 4, batch 3924
training loss: 0.01786116138100624 

Epoch 4, batch 3925
training loss: 0.021594572812318802 

Epoch 4, batch 3926
training loss: 0.2747231125831604 

Epoch 4, batch 3927
training loss: 0.06745831668376923 

Epoch 4, batch 3928
training loss: 0.09571222215890884 

Epoch 4, batch 3929
training loss: 0.04287498816847801 

Epoch 4, batch 3930
training loss: 0.09587620943784714 

Epoch 4, batch 3931
training loss: 0.0226235743612051 

Epoch 4, batch 3932
training loss: 0

Epoch 4, batch 4139
training loss: 0.15172290802001953 

Epoch 4, batch 4140
training loss: 0.04650329425930977 

Epoch 4, batch 4141
training loss: 0.08534064888954163 

Epoch 4, batch 4142
training loss: 0.1310596764087677 

Epoch 4, batch 4143
training loss: 0.23959186673164368 

Epoch 4, batch 4144
training loss: 0.033897846937179565 

Epoch 4, batch 4145
training loss: 0.2962583899497986 

Epoch 4, batch 4146
training loss: 0.04132004827260971 

Epoch 4, batch 4147
training loss: 0.006866142153739929 

Epoch 4, batch 4148
training loss: 0.16029909253120422 

Epoch 4, batch 4149
training loss: 0.09579736739397049 

Epoch 4, batch 4150
training loss: 0.07826614379882812 

Epoch 4, batch 4151
training loss: 0.028706688433885574 

Epoch 4, batch 4152
training loss: 0.06010551378130913 

Epoch 4, batch 4153
training loss: 0.012955807149410248 

Epoch 4, batch 4154
training loss: 0.32807958126068115 

Epoch 4, batch 4155
training loss: 0.03998269513249397 

Epoch 4, batch 4156
training 

Epoch 4, batch 4364
training loss: 0.13256242871284485 

Epoch 4, batch 4365
training loss: 0.10280672460794449 

Epoch 4, batch 4366
training loss: 0.22267469763755798 

Epoch 4, batch 4367
training loss: 0.12700501084327698 

Epoch 4, batch 4368
training loss: 0.15909509360790253 

Epoch 4, batch 4369
training loss: 0.18841338157653809 

Epoch 4, batch 4370
training loss: 0.6630114316940308 

Epoch 4, batch 4371
training loss: 0.046749942004680634 

Epoch 4, batch 4372
training loss: 0.05985928326845169 

Epoch 4, batch 4373
training loss: 0.014596645720303059 

Epoch 4, batch 4374
training loss: 0.20848853886127472 

Epoch 4, batch 4375
training loss: 0.7530788779258728 

Epoch 4, batch 4376
training loss: 0.33953702449798584 

Epoch 4, batch 4377
training loss: 0.17171837389469147 

Epoch 4, batch 4378
training loss: 0.02496691793203354 

Epoch 4, batch 4379
training loss: 0.015974868088960648 

Epoch 4, batch 4380
training loss: 0.1470693051815033 

Epoch 4, batch 4381
training lo

Epoch 4, batch 4589
training loss: 0.022660788148641586 

Epoch 4, batch 4590
training loss: 0.05616312101483345 

Epoch 4, batch 4591
training loss: 0.12396298348903656 

Epoch 4, batch 4592
training loss: 0.02392645739018917 

Epoch 4, batch 4593
training loss: 0.06203886866569519 

Epoch 4, batch 4594
training loss: 0.0887468233704567 

Epoch 4, batch 4595
training loss: 0.2942083179950714 

Epoch 4, batch 4596
training loss: 0.06473401933908463 

Epoch 4, batch 4597
training loss: 0.18527889251708984 

Epoch 4, batch 4598
training loss: 0.19489090144634247 

Epoch 4, batch 4599
training loss: 0.23151054978370667 

Epoch 4, batch 4600
training loss: 0.019991695880889893 

Epoch 4, batch 4601
training loss: 0.207455113530159 

Epoch 4, batch 4602
training loss: 0.05380818247795105 

Epoch 4, batch 4603
training loss: 0.4153802990913391 

Epoch 4, batch 4604
training loss: 0.09618730843067169 

Epoch 4, batch 4605
training loss: 0.244713693857193 

Epoch 4, batch 4606
training loss: 0

Epoch 4, batch 4810
training loss: 0.041151322424411774 

Epoch 4, batch 4811
training loss: 0.033194467425346375 

Epoch 4, batch 4812
training loss: 0.0293283574283123 

Epoch 4, batch 4813
training loss: 0.6746723055839539 

Epoch 4, batch 4814
training loss: 0.11155754327774048 

Epoch 4, batch 4815
training loss: 0.7801645398139954 

Epoch 4, batch 4816
training loss: 0.039812538772821426 

Epoch 4, batch 4817
training loss: 0.40792346000671387 

Epoch 4, batch 4818
training loss: 0.01417307835072279 

Epoch 4, batch 4819
training loss: 0.030006974935531616 

Epoch 4, batch 4820
training loss: 0.08736173808574677 

Epoch 4, batch 4821
training loss: 0.37654823064804077 

Epoch 4, batch 4822
training loss: 0.056487925350666046 

Epoch 4, batch 4823
training loss: 0.2810346186161041 

Epoch 4, batch 4824
training loss: 0.13242612779140472 

Epoch 4, batch 4825
training loss: 0.19344642758369446 

Epoch 4, batch 4826
training loss: 0.22890742123126984 

Epoch 4, batch 4827
training l

Epoch 4, batch 5030
training loss: 0.9181990623474121 

Epoch 4, batch 5031
training loss: 0.25252336263656616 

Epoch 4, batch 5032
training loss: 0.016319122165441513 

Epoch 4, batch 5033
training loss: 0.44482582807540894 

Epoch 4, batch 5034
training loss: 0.055520545691251755 

Epoch 4, batch 5035
training loss: 0.04876181110739708 

Epoch 4, batch 5036
training loss: 0.00743546849116683 

Epoch 4, batch 5037
training loss: 0.27134042978286743 

Epoch 4, batch 5038
training loss: 0.020569700747728348 

Epoch 4, batch 5039
training loss: 0.1748659908771515 

Epoch 4, batch 5040
training loss: 0.6748605966567993 

Epoch 4, batch 5041
training loss: 0.02606775239109993 

Epoch 4, batch 5042
training loss: 0.050221286714076996 

Epoch 4, batch 5043
training loss: 0.012400394305586815 

Epoch 4, batch 5044
training loss: 0.8475111126899719 

Epoch 4, batch 5045
training loss: 0.1863393485546112 

Epoch 4, batch 5046
training loss: 0.033738307654857635 

Epoch 4, batch 5047
training l

Epoch 4, batch 5250
training loss: 0.09769318252801895 

Epoch 4, batch 5251
training loss: 0.03359713405370712 

Epoch 4, batch 5252
training loss: 0.013878392055630684 

Epoch 4, batch 5253
training loss: 0.11077722162008286 

Epoch 4, batch 5254
training loss: 0.7117193341255188 

Epoch 4, batch 5255
training loss: 0.03245038911700249 

Epoch 4, batch 5256
training loss: 0.043147020041942596 

Epoch 4, batch 5257
training loss: 0.6857723593711853 

Epoch 4, batch 5258
training loss: 0.6335790157318115 

Epoch 4, batch 5259
training loss: 0.039570122957229614 

Epoch 4, batch 5260
training loss: 0.2354646921157837 

Epoch 4, batch 5261
training loss: 0.3114086389541626 

Epoch 4, batch 5262
training loss: 0.03647422790527344 

Epoch 4, batch 5263
training loss: 0.30115851759910583 

Epoch 4, batch 5264
training loss: 0.04481211677193642 

Epoch 4, batch 5265
training loss: 0.034844253212213516 

Epoch 4, batch 5266
training loss: 0.5215584635734558 

Epoch 4, batch 5267
training loss

Epoch 4, batch 5463
training loss: 0.008793383836746216 

Epoch 4, batch 5464
training loss: 0.642453134059906 

Epoch 4, batch 5465
training loss: 0.023867130279541016 

Epoch 4, batch 5466
training loss: 0.019740764051675797 

Epoch 4, batch 5467
training loss: 0.03718361258506775 

Epoch 4, batch 5468
training loss: 0.3890962302684784 

Epoch 4, batch 5469
training loss: 0.027543460950255394 

Epoch 4, batch 5470
training loss: 0.2084851711988449 

Epoch 4, batch 5471
training loss: 0.48695650696754456 

Epoch 4, batch 5472
training loss: 0.009470272809267044 

Epoch 4, batch 5473
training loss: 0.17759452760219574 

Epoch 4, batch 5474
training loss: 0.013087722472846508 

Epoch 4, batch 5475
training loss: 0.128729447722435 

Epoch 4, batch 5476
training loss: 0.07616876065731049 

Epoch 4, batch 5477
training loss: 0.01946583390235901 

Epoch 4, batch 5478
training loss: 0.1016884297132492 

Epoch 4, batch 5479
training loss: 0.044484976679086685 

Epoch 4, batch 5480
training lo

Epoch 4, batch 5683
training loss: 0.13520684838294983 

Epoch 4, batch 5684
training loss: 0.04558476433157921 

Epoch 4, batch 5685
training loss: 0.11712010949850082 

Epoch 4, batch 5686
training loss: 0.6885957717895508 

Epoch 4, batch 5687
training loss: 0.03512202948331833 

Epoch 4, batch 5688
training loss: 0.04438186064362526 

Epoch 4, batch 5689
training loss: 0.016767069697380066 

Epoch 4, batch 5690
training loss: 0.03359217569231987 

Epoch 4, batch 5691
training loss: 0.7307530641555786 

Epoch 4, batch 5692
training loss: 0.18116223812103271 

Epoch 4, batch 5693
training loss: 0.05627971887588501 

Epoch 4, batch 5694
training loss: 0.17601121962070465 

Epoch 4, batch 5695
training loss: 0.040463823825120926 

Epoch 4, batch 5696
training loss: 0.5716493725776672 

Epoch 4, batch 5697
training loss: 0.07135923206806183 

Epoch 4, batch 5698
training loss: 0.6469131112098694 

Epoch 4, batch 5699
training loss: 0.08967848122119904 

Epoch 4, batch 5700
training loss

Epoch 4, batch 5905
training loss: 0.18512384593486786 

Epoch 4, batch 5906
training loss: 0.028482193127274513 

Epoch 4, batch 5907
training loss: 1.0963430404663086 

Epoch 4, batch 5908
training loss: 0.271526575088501 

Epoch 4, batch 5909
training loss: 0.33427804708480835 

Epoch 4, batch 5910
training loss: 0.027782639488577843 

Epoch 4, batch 5911
training loss: 0.2723456025123596 

Epoch 4, batch 5912
training loss: 0.03337257727980614 

Epoch 4, batch 5913
training loss: 0.5581651926040649 

Epoch 4, batch 5914
training loss: 0.20054221153259277 

Epoch 4, batch 5915
training loss: 0.06916588544845581 

Epoch 4, batch 5916
training loss: 0.3756828308105469 

Epoch 4, batch 5917
training loss: 0.12639550864696503 

Epoch 4, batch 5918
training loss: 0.11250908672809601 

Epoch 4, batch 5919
training loss: 0.06759720295667648 

Epoch 4, batch 5920
training loss: 0.12028421461582184 

Epoch 4, batch 5921
training loss: 0.14654585719108582 

Epoch 4, batch 5922
training loss: 

Epoch 5, batch 121
training loss: 0.14082071185112 

Epoch 5, batch 122
training loss: 0.0038620170671492815 

Epoch 5, batch 123
training loss: 0.12161917984485626 

Epoch 5, batch 124
training loss: 0.05362505838274956 

Epoch 5, batch 125
training loss: 0.13908830285072327 

Epoch 5, batch 126
training loss: 0.019343378022313118 

Epoch 5, batch 127
training loss: 0.011614090763032436 

Epoch 5, batch 128
training loss: 0.16757459938526154 

Epoch 5, batch 129
training loss: 0.03382747620344162 

Epoch 5, batch 130
training loss: 0.03693590313196182 

Epoch 5, batch 131
training loss: 0.12981458008289337 

Epoch 5, batch 132
training loss: 0.6145542860031128 

Epoch 5, batch 133
training loss: 0.29741397500038147 

Epoch 5, batch 134
training loss: 0.47799259424209595 

Epoch 5, batch 135
training loss: 0.08309165388345718 

Epoch 5, batch 136
training loss: 0.026380708441138268 

Epoch 5, batch 137
training loss: 0.27735596895217896 

Epoch 5, batch 138
training loss: 0.42565846443

Epoch 5, batch 341
training loss: 0.04792313277721405 

Epoch 5, batch 342
training loss: 0.11071278899908066 

Epoch 5, batch 343
training loss: 0.022063378244638443 

Epoch 5, batch 344
training loss: 0.3480706810951233 

Epoch 5, batch 345
training loss: 0.08102715015411377 

Epoch 5, batch 346
training loss: 0.13068938255310059 

Epoch 5, batch 347
training loss: 0.04044298082590103 

Epoch 5, batch 348
training loss: 0.07563916593790054 

Epoch 5, batch 349
training loss: 0.29878050088882446 

Epoch 5, batch 350
training loss: 0.049731843173503876 

Epoch 5, batch 351
training loss: 0.07842260599136353 

Epoch 5, batch 352
training loss: 0.03806806728243828 

Epoch 5, batch 353
training loss: 0.009363762103021145 

Epoch 5, batch 354
training loss: 0.16340085864067078 

Epoch 5, batch 355
training loss: 0.06865439563989639 

Epoch 5, batch 356
training loss: 0.07625963538885117 

Epoch 5, batch 357
training loss: 0.3117523789405823 

Epoch 5, batch 358
training loss: 0.02434163354

Epoch 5, batch 566
training loss: 0.1386372447013855 

Epoch 5, batch 567
training loss: 0.24900713562965393 

Epoch 5, batch 568
training loss: 0.017737995833158493 

Epoch 5, batch 569
training loss: 0.07130877673625946 

Epoch 5, batch 570
training loss: 0.09870202839374542 

Epoch 5, batch 571
training loss: 0.6469592452049255 

Epoch 5, batch 572
training loss: 0.4444083273410797 

Epoch 5, batch 573
training loss: 0.14599725604057312 

Epoch 5, batch 574
training loss: 0.01078737247735262 

Epoch 5, batch 575
training loss: 0.004463613964617252 

Epoch 5, batch 576
training loss: 0.08850665390491486 

Epoch 5, batch 577
training loss: 0.3986274302005768 

Epoch 5, batch 578
training loss: 0.3307233452796936 

Epoch 5, batch 579
training loss: 0.01733131892979145 

Epoch 5, batch 580
training loss: 0.24151602387428284 

Epoch 5, batch 581
training loss: 0.004125765059143305 

Epoch 5, batch 582
training loss: 0.07186774909496307 

Epoch 5, batch 583
training loss: 0.03180174902081

Epoch 5, batch 788
training loss: 0.01870615780353546 

Epoch 5, batch 789
training loss: 0.8696401715278625 

Epoch 5, batch 790
training loss: 0.012777228839695454 

Epoch 5, batch 791
training loss: 0.05594277381896973 

Epoch 5, batch 792
training loss: 0.2644413709640503 

Epoch 5, batch 793
training loss: 0.027311142534017563 

Epoch 5, batch 794
training loss: 0.23202213644981384 

Epoch 5, batch 795
training loss: 0.025219757109880447 

Epoch 5, batch 796
training loss: 0.012346690520644188 

Epoch 5, batch 797
training loss: 0.18331654369831085 

Epoch 5, batch 798
training loss: 0.12574389576911926 

Epoch 5, batch 799
training loss: 0.05831925943493843 

Epoch 5, batch 800
training loss: 0.29134875535964966 

Epoch 5, batch 801
training loss: 0.16157224774360657 

Epoch 5, batch 802
training loss: 0.05177807807922363 

Epoch 5, batch 803
training loss: 0.01671454682946205 

Epoch 5, batch 804
training loss: 0.0825827345252037 

Epoch 5, batch 805
training loss: 0.10297811031

Epoch 5, batch 1006
training loss: 0.014072312042117119 

Epoch 5, batch 1007
training loss: 0.0597589835524559 

Epoch 5, batch 1008
training loss: 0.017109176144003868 

Epoch 5, batch 1009
training loss: 0.052789561450481415 

Epoch 5, batch 1010
training loss: 0.017018422484397888 

Epoch 5, batch 1011
training loss: 0.0159701406955719 

Epoch 5, batch 1012
training loss: 0.03318279609084129 

Epoch 5, batch 1013
training loss: 0.04135284200310707 

Epoch 5, batch 1014
training loss: 0.05486242100596428 

Epoch 5, batch 1015
training loss: 0.10702663660049438 

Epoch 5, batch 1016
training loss: 0.19765807688236237 

Epoch 5, batch 1017
training loss: 0.029540961608290672 

Epoch 5, batch 1018
training loss: 0.3368811011314392 

Epoch 5, batch 1019
training loss: 0.011231498792767525 

Epoch 5, batch 1020
training loss: 0.09262481331825256 

Epoch 5, batch 1021
training loss: 0.055459391325712204 

Epoch 5, batch 1022
training loss: 0.011556949466466904 

Epoch 5, batch 1023
traini

Epoch 5, batch 1228
training loss: 0.017264513298869133 

Epoch 5, batch 1229
training loss: 0.04909772798418999 

Epoch 5, batch 1230
training loss: 0.112005315721035 

Epoch 5, batch 1231
training loss: 0.02593766525387764 

Epoch 5, batch 1232
training loss: 0.14228121936321259 

Epoch 5, batch 1233
training loss: 0.014211894944310188 

Epoch 5, batch 1234
training loss: 0.11739702522754669 

Epoch 5, batch 1235
training loss: 0.20372983813285828 

Epoch 5, batch 1236
training loss: 0.10791227966547012 

Epoch 5, batch 1237
training loss: 0.03826833516359329 

Epoch 5, batch 1238
training loss: 0.03137846291065216 

Epoch 5, batch 1239
training loss: 1.0507184267044067 

Epoch 5, batch 1240
training loss: 0.015541593544185162 

Epoch 5, batch 1241
training loss: 0.034391261637210846 

Epoch 5, batch 1242
training loss: 0.01385944802314043 

Epoch 5, batch 1243
training loss: 0.17804357409477234 

Epoch 5, batch 1244
training loss: 0.015639811754226685 

Epoch 5, batch 1245
training 

Epoch 5, batch 1449
training loss: 0.26335951685905457 

Epoch 5, batch 1450
training loss: 0.07733551412820816 

Epoch 5, batch 1451
training loss: 0.027121922001242638 

Epoch 5, batch 1452
training loss: 0.3602730631828308 

Epoch 5, batch 1453
training loss: 0.009897509589791298 

Epoch 5, batch 1454
training loss: 0.163425475358963 

Epoch 5, batch 1455
training loss: 0.028388043865561485 

Epoch 5, batch 1456
training loss: 0.031200643628835678 

Epoch 5, batch 1457
training loss: 0.05120228976011276 

Epoch 5, batch 1458
training loss: 0.014283841475844383 

Epoch 5, batch 1459
training loss: 0.17667649686336517 

Epoch 5, batch 1460
training loss: 0.003032286185771227 

Epoch 5, batch 1461
training loss: 0.01474597118794918 

Epoch 5, batch 1462
training loss: 0.011987698264420033 

Epoch 5, batch 1463
training loss: 0.0729416012763977 

Epoch 5, batch 1464
training loss: 0.015228645876049995 

Epoch 5, batch 1465
training loss: 0.04402174800634384 

Epoch 5, batch 1466
trainin

Epoch 5, batch 1672
training loss: 0.29874998331069946 

Epoch 5, batch 1673
training loss: 0.12120777368545532 

Epoch 5, batch 1674
training loss: 0.06793414801359177 

Epoch 5, batch 1675
training loss: 0.16064389050006866 

Epoch 5, batch 1676
training loss: 0.049212805926799774 

Epoch 5, batch 1677
training loss: 0.07092611491680145 

Epoch 5, batch 1678
training loss: 0.1623144894838333 

Epoch 5, batch 1679
training loss: 0.005127105861902237 

Epoch 5, batch 1680
training loss: 0.11162398755550385 

Epoch 5, batch 1681
training loss: 0.05021033436059952 

Epoch 5, batch 1682
training loss: 0.03928690031170845 

Epoch 5, batch 1683
training loss: 0.054355185478925705 

Epoch 5, batch 1684
training loss: 0.8692567944526672 

Epoch 5, batch 1685
training loss: 0.24672546982765198 

Epoch 5, batch 1686
training loss: 0.19598332047462463 

Epoch 5, batch 1687
training loss: 0.04675193503499031 

Epoch 5, batch 1688
training loss: 0.036506835371255875 

Epoch 5, batch 1689
training 

Epoch 5, batch 1895
training loss: 0.1534224897623062 

Epoch 5, batch 1896
training loss: 0.052886318415403366 

Epoch 5, batch 1897
training loss: 0.17870251834392548 

Epoch 5, batch 1898
training loss: 0.15459956228733063 

Epoch 5, batch 1899
training loss: 0.028319358825683594 

Epoch 5, batch 1900
training loss: 0.007886767387390137 

Epoch 5, batch 1901
training loss: 0.21340210735797882 

Epoch 5, batch 1902
training loss: 0.16398510336875916 

Epoch 5, batch 1903
training loss: 0.06866510957479477 

Epoch 5, batch 1904
training loss: 0.7644144296646118 

Epoch 5, batch 1905
training loss: 0.06312890350818634 

Epoch 5, batch 1906
training loss: 0.1602802872657776 

Epoch 5, batch 1907
training loss: 0.02286127582192421 

Epoch 5, batch 1908
training loss: 0.03510754555463791 

Epoch 5, batch 1909
training loss: 0.8907986879348755 

Epoch 5, batch 1910
training loss: 0.046323880553245544 

Epoch 5, batch 1911
training loss: 0.1259351372718811 

Epoch 5, batch 1912
training los

Epoch 5, batch 2117
training loss: 0.5800560712814331 

Epoch 5, batch 2118
training loss: 0.08449693024158478 

Epoch 5, batch 2119
training loss: 0.561302125453949 

Epoch 5, batch 2120
training loss: 0.19841109216213226 

Epoch 5, batch 2121
training loss: 0.06643307954072952 

Epoch 5, batch 2122
training loss: 0.07410784065723419 

Epoch 5, batch 2123
training loss: 0.16902010142803192 

Epoch 5, batch 2124
training loss: 0.029447004199028015 

Epoch 5, batch 2125
training loss: 0.10662917047739029 

Epoch 5, batch 2126
training loss: 0.33401912450790405 

Epoch 5, batch 2127
training loss: 0.04056306555867195 

Epoch 5, batch 2128
training loss: 0.10512650012969971 

Epoch 5, batch 2129
training loss: 0.035674676299095154 

Epoch 5, batch 2130
training loss: 0.013410868123173714 

Epoch 5, batch 2131
training loss: 0.03273039311170578 

Epoch 5, batch 2132
training loss: 0.013515226542949677 

Epoch 5, batch 2133
training loss: 0.03466419875621796 

Epoch 5, batch 2134
training l

Epoch 5, batch 2340
training loss: 0.07163870334625244 

Epoch 5, batch 2341
training loss: 0.6911531090736389 

Epoch 5, batch 2342
training loss: 0.29607123136520386 

Epoch 5, batch 2343
training loss: 0.04163045436143875 

Epoch 5, batch 2344
training loss: 0.7380844354629517 

Epoch 5, batch 2345
training loss: 0.2816255986690521 

Epoch 5, batch 2346
training loss: 0.056648802012205124 

Epoch 5, batch 2347
training loss: 0.09315383434295654 

Epoch 5, batch 2348
training loss: 0.18458062410354614 

Epoch 5, batch 2349
training loss: 0.5041202902793884 

Epoch 5, batch 2350
training loss: 0.007136767264455557 

Epoch 5, batch 2351
training loss: 0.1667623221874237 

Epoch 5, batch 2352
training loss: 0.0555635467171669 

Epoch 5, batch 2353
training loss: 0.04540126770734787 

Epoch 5, batch 2354
training loss: 0.8470511436462402 

Epoch 5, batch 2355
training loss: 0.29729050397872925 

Epoch 5, batch 2356
training loss: 0.12107180058956146 

Epoch 5, batch 2357
training loss: 0

Epoch 5, batch 2564
training loss: 0.4072175621986389 

Epoch 5, batch 2565
training loss: 0.20520584285259247 

Epoch 5, batch 2566
training loss: 0.017304323613643646 

Epoch 5, batch 2567
training loss: 0.14989176392555237 

Epoch 5, batch 2568
training loss: 0.05568487569689751 

Epoch 5, batch 2569
training loss: 0.0338321253657341 

Epoch 5, batch 2570
training loss: 0.04719984158873558 

Epoch 5, batch 2571
training loss: 0.12602201104164124 

Epoch 5, batch 2572
training loss: 0.2915729582309723 

Epoch 5, batch 2573
training loss: 0.2930023670196533 

Epoch 5, batch 2574
training loss: 0.6674867868423462 

Epoch 5, batch 2575
training loss: 0.39485636353492737 

Epoch 5, batch 2576
training loss: 0.1592927873134613 

Epoch 5, batch 2577
training loss: 0.24600474536418915 

Epoch 5, batch 2578
training loss: 0.10502038151025772 

Epoch 5, batch 2579
training loss: 0.08028385788202286 

Epoch 5, batch 2580
training loss: 0.6416892409324646 

Epoch 5, batch 2581
training loss: 0.

Epoch 5, batch 2790
training loss: 0.740047812461853 

Epoch 5, batch 2791
training loss: 0.1421479433774948 

Epoch 5, batch 2792
training loss: 0.02878873609006405 

Epoch 5, batch 2793
training loss: 0.21352677047252655 

Epoch 5, batch 2794
training loss: 0.249006986618042 

Epoch 5, batch 2795
training loss: 0.022078920155763626 

Epoch 5, batch 2796
training loss: 0.015000557526946068 

Epoch 5, batch 2797
training loss: 0.21309097111225128 

Epoch 5, batch 2798
training loss: 0.17259855568408966 

Epoch 5, batch 2799
training loss: 0.03274831920862198 

Epoch 5, batch 2800
training loss: 0.0871427059173584 

Epoch 5, batch 2801
training loss: 0.4949924051761627 

Epoch 5, batch 2802
training loss: 0.04169561713933945 

Epoch 5, batch 2803
training loss: 0.037345852702856064 

Epoch 5, batch 2804
training loss: 0.014297771267592907 

Epoch 5, batch 2805
training loss: 0.18090513348579407 

Epoch 5, batch 2806
training loss: 0.07521601021289825 

Epoch 5, batch 2807
training loss:

Epoch 5, batch 3012
training loss: 0.2718837857246399 

Epoch 5, batch 3013
training loss: 0.015170465223491192 

Epoch 5, batch 3014
training loss: 0.0739273652434349 

Epoch 5, batch 3015
training loss: 0.011253366246819496 

Epoch 5, batch 3016
training loss: 0.028930461034178734 

Epoch 5, batch 3017
training loss: 0.016619164496660233 

Epoch 5, batch 3018
training loss: 0.032780058681964874 

Epoch 5, batch 3019
training loss: 0.03847494348883629 

Epoch 5, batch 3020
training loss: 0.15676584839820862 

Epoch 5, batch 3021
training loss: 0.2968387007713318 

Epoch 5, batch 3022
training loss: 0.08398675918579102 

Epoch 5, batch 3023
training loss: 0.005790125112980604 

Epoch 5, batch 3024
training loss: 0.0385761633515358 

Epoch 5, batch 3025
training loss: 0.2783176004886627 

Epoch 5, batch 3026
training loss: 0.049252189695835114 

Epoch 5, batch 3027
training loss: 0.32312676310539246 

Epoch 5, batch 3028
training loss: 0.06562597304582596 

Epoch 5, batch 3029
training 

Epoch 5, batch 3235
training loss: 0.23956997692584991 

Epoch 5, batch 3236
training loss: 0.020720498636364937 

Epoch 5, batch 3237
training loss: 0.15114855766296387 

Epoch 5, batch 3238
training loss: 0.17876036465168 

Epoch 5, batch 3239
training loss: 0.44075527787208557 

Epoch 5, batch 3240
training loss: 0.10538192838430405 

Epoch 5, batch 3241
training loss: 0.00589213240891695 

Epoch 5, batch 3242
training loss: 0.4798329472541809 

Epoch 5, batch 3243
training loss: 0.06300204992294312 

Epoch 5, batch 3244
training loss: 0.5663647651672363 

Epoch 5, batch 3245
training loss: 0.013124319724738598 

Epoch 5, batch 3246
training loss: 0.12484900653362274 

Epoch 5, batch 3247
training loss: 0.026232704520225525 

Epoch 5, batch 3248
training loss: 0.015416985377669334 

Epoch 5, batch 3249
training loss: 0.028618836775422096 

Epoch 5, batch 3250
training loss: 0.017489563673734665 

Epoch 5, batch 3251
training loss: 0.2875349521636963 

Epoch 5, batch 3252
training lo

Epoch 5, batch 3457
training loss: 0.023745087906718254 

Epoch 5, batch 3458
training loss: 0.0745336264371872 

Epoch 5, batch 3459
training loss: 0.015019243583083153 

Epoch 5, batch 3460
training loss: 0.05769004672765732 

Epoch 5, batch 3461
training loss: 0.2764349579811096 

Epoch 5, batch 3462
training loss: 0.14946205914020538 

Epoch 5, batch 3463
training loss: 0.06500829756259918 

Epoch 5, batch 3464
training loss: 0.17082761228084564 

Epoch 5, batch 3465
training loss: 0.08204778283834457 

Epoch 5, batch 3466
training loss: 0.17986837029457092 

Epoch 5, batch 3467
training loss: 0.07177673280239105 

Epoch 5, batch 3468
training loss: 0.44479450583457947 

Epoch 5, batch 3469
training loss: 0.1601056605577469 

Epoch 5, batch 3470
training loss: 0.15714259445667267 

Epoch 5, batch 3471
training loss: 0.24034488201141357 

Epoch 5, batch 3472
training loss: 0.24480195343494415 

Epoch 5, batch 3473
training loss: 0.633996307849884 

Epoch 5, batch 3474
training loss:

Epoch 5, batch 3672
training loss: 0.12094171345233917 

Epoch 5, batch 3673
training loss: 0.15699502825737 

Epoch 5, batch 3674
training loss: 0.830124020576477 

Epoch 5, batch 3675
training loss: 0.06287175416946411 

Epoch 5, batch 3676
training loss: 0.01828763633966446 

Epoch 5, batch 3677
training loss: 0.7891306281089783 

Epoch 5, batch 3678
training loss: 0.8212669491767883 

Epoch 5, batch 3679
training loss: 0.04271135479211807 

Epoch 5, batch 3680
training loss: 0.018839094787836075 

Epoch 5, batch 3681
training loss: 0.05200587585568428 

Epoch 5, batch 3682
training loss: 0.19235917925834656 

Epoch 5, batch 3683
training loss: 0.047079652547836304 

Epoch 5, batch 3684
training loss: 0.04651731997728348 

Epoch 5, batch 3685
training loss: 0.032148655503988266 

Epoch 5, batch 3686
training loss: 0.22522631287574768 

Epoch 5, batch 3687
training loss: 0.1288827359676361 

Epoch 5, batch 3688
training loss: 0.08190913498401642 

Epoch 5, batch 3689
training loss: 0

Epoch 5, batch 3893
training loss: 0.44589194655418396 

Epoch 5, batch 3894
training loss: 0.30238330364227295 

Epoch 5, batch 3895
training loss: 0.8686856031417847 

Epoch 5, batch 3896
training loss: 0.1459515541791916 

Epoch 5, batch 3897
training loss: 0.032375868409872055 

Epoch 5, batch 3898
training loss: 0.3865239918231964 

Epoch 5, batch 3899
training loss: 0.021007299423217773 

Epoch 5, batch 3900
training loss: 0.07365855574607849 

Epoch 5, batch 3901
training loss: 0.18950696289539337 

Epoch 5, batch 3902
training loss: 0.36277854442596436 

Epoch 5, batch 3903
training loss: 0.22274520993232727 

Epoch 5, batch 3904
training loss: 0.3370506167411804 

Epoch 5, batch 3905
training loss: 0.019571777433156967 

Epoch 5, batch 3906
training loss: 0.05419016629457474 

Epoch 5, batch 3907
training loss: 0.07888078689575195 

Epoch 5, batch 3908
training loss: 0.3221574127674103 

Epoch 5, batch 3909
training loss: 0.026009712368249893 

Epoch 5, batch 3910
training los

Epoch 5, batch 4115
training loss: 0.007608366664499044 

Epoch 5, batch 4116
training loss: 0.024929294362664223 

Epoch 5, batch 4117
training loss: 0.17787912487983704 

Epoch 5, batch 4118
training loss: 0.12263353914022446 

Epoch 5, batch 4119
training loss: 0.3672577738761902 

Epoch 5, batch 4120
training loss: 0.3790145516395569 

Epoch 5, batch 4121
training loss: 0.04766060411930084 

Epoch 5, batch 4122
training loss: 0.006200741045176983 

Epoch 5, batch 4123
training loss: 0.406977117061615 

Epoch 5, batch 4124
training loss: 0.2153785228729248 

Epoch 5, batch 4125
training loss: 0.03364337235689163 

Epoch 5, batch 4126
training loss: 0.054818641394376755 

Epoch 5, batch 4127
training loss: 0.02481865882873535 

Epoch 5, batch 4128
training loss: 0.05043210834264755 

Epoch 5, batch 4129
training loss: 0.06966851651668549 

Epoch 5, batch 4130
training loss: 0.07342755794525146 

Epoch 5, batch 4131
training loss: 0.04723341763019562 

Epoch 5, batch 4132
training los

Epoch 5, batch 4330
training loss: 0.222425177693367 

Epoch 5, batch 4331
training loss: 0.044996194541454315 

Epoch 5, batch 4332
training loss: 0.10509006679058075 

Epoch 5, batch 4333
training loss: 0.027669697999954224 

Epoch 5, batch 4334
training loss: 0.00643559917807579 

Epoch 5, batch 4335
training loss: 0.04570995271205902 

Epoch 5, batch 4336
training loss: 0.010441174730658531 

Epoch 5, batch 4337
training loss: 0.027055537328124046 

Epoch 5, batch 4338
training loss: 0.1982107162475586 

Epoch 5, batch 4339
training loss: 0.3178470730781555 

Epoch 5, batch 4340
training loss: 0.18963249027729034 

Epoch 5, batch 4341
training loss: 0.04226590692996979 

Epoch 5, batch 4342
training loss: 0.27324628829956055 

Epoch 5, batch 4343
training loss: 0.008219114504754543 

Epoch 5, batch 4344
training loss: 0.026425674557685852 

Epoch 5, batch 4345
training loss: 0.3968431055545807 

Epoch 5, batch 4346
training loss: 0.02307913452386856 

Epoch 5, batch 4347
training l

Epoch 5, batch 4554
training loss: 0.08345656841993332 

Epoch 5, batch 4555
training loss: 0.11327739804983139 

Epoch 5, batch 4556
training loss: 0.017141755670309067 

Epoch 5, batch 4557
training loss: 0.07569779455661774 

Epoch 5, batch 4558
training loss: 0.021020127460360527 

Epoch 5, batch 4559
training loss: 0.3307463228702545 

Epoch 5, batch 4560
training loss: 0.017561424523591995 

Epoch 5, batch 4561
training loss: 0.10148926079273224 

Epoch 5, batch 4562
training loss: 0.12404010444879532 

Epoch 5, batch 4563
training loss: 0.03908296674489975 

Epoch 5, batch 4564
training loss: 0.6850103139877319 

Epoch 5, batch 4565
training loss: 0.019089650362730026 

Epoch 5, batch 4566
training loss: 0.014601150527596474 

Epoch 5, batch 4567
training loss: 0.005045302212238312 

Epoch 5, batch 4568
training loss: 0.006545933894813061 

Epoch 5, batch 4569
training loss: 0.03228975459933281 

Epoch 5, batch 4570
training loss: 0.0075147515162825584 

Epoch 5, batch 4571
trai

Epoch 5, batch 4778
training loss: 0.011999840848147869 

Epoch 5, batch 4779
training loss: 0.13875597715377808 

Epoch 5, batch 4780
training loss: 0.007188253104686737 

Epoch 5, batch 4781
training loss: 0.5299161076545715 

Epoch 5, batch 4782
training loss: 0.08636210858821869 

Epoch 5, batch 4783
training loss: 0.01252101082354784 

Epoch 5, batch 4784
training loss: 0.10237669944763184 

Epoch 5, batch 4785
training loss: 0.013247847557067871 

Epoch 5, batch 4786
training loss: 0.4410478174686432 

Epoch 5, batch 4787
training loss: 0.010328839533030987 

Epoch 5, batch 4788
training loss: 0.022333992645144463 

Epoch 5, batch 4789
training loss: 0.1230490654706955 

Epoch 5, batch 4790
training loss: 0.07287494093179703 

Epoch 5, batch 4791
training loss: 0.021830972284078598 

Epoch 5, batch 4792
training loss: 0.06324125826358795 

Epoch 5, batch 4793
training loss: 0.06287263333797455 

Epoch 5, batch 4794
training loss: 0.4768676161766052 

Epoch 5, batch 4795
training 

Epoch 5, batch 5003
training loss: 0.12334223091602325 

Epoch 5, batch 5004
training loss: 0.01838645152747631 

Epoch 5, batch 5005
training loss: 0.224442720413208 

Epoch 5, batch 5006
training loss: 0.045364659279584885 

Epoch 5, batch 5007
training loss: 0.020370904356241226 

Epoch 5, batch 5008
training loss: 0.04892507940530777 

Epoch 5, batch 5009
training loss: 0.07058651745319366 

Epoch 5, batch 5010
training loss: 0.02490590699017048 

Epoch 5, batch 5011
training loss: 0.3205544352531433 

Epoch 5, batch 5012
training loss: 0.10707950592041016 

Epoch 5, batch 5013
training loss: 0.07152289897203445 

Epoch 5, batch 5014
training loss: 0.019370349124073982 

Epoch 5, batch 5015
training loss: 0.09302634000778198 

Epoch 5, batch 5016
training loss: 0.2838899493217468 

Epoch 5, batch 5017
training loss: 0.008708124980330467 

Epoch 5, batch 5018
training loss: 0.045790888369083405 

Epoch 5, batch 5019
training loss: 0.026621047407388687 

Epoch 5, batch 5020
training 

Epoch 5, batch 5226
training loss: 0.23990586400032043 

Epoch 5, batch 5227
training loss: 0.012274547480046749 

Epoch 5, batch 5228
training loss: 0.2902666926383972 

Epoch 5, batch 5229
training loss: 0.027032842859625816 

Epoch 5, batch 5230
training loss: 0.2072804719209671 

Epoch 5, batch 5231
training loss: 0.45582738518714905 

Epoch 5, batch 5232
training loss: 0.07234837114810944 

Epoch 5, batch 5233
training loss: 0.07319457828998566 

Epoch 5, batch 5234
training loss: 0.12183880805969238 

Epoch 5, batch 5235
training loss: 0.11614231765270233 

Epoch 5, batch 5236
training loss: 0.1789708286523819 

Epoch 5, batch 5237
training loss: 0.26511746644973755 

Epoch 5, batch 5238
training loss: 0.5595912933349609 

Epoch 5, batch 5239
training loss: 0.046193305402994156 

Epoch 5, batch 5240
training loss: 0.2592085003852844 

Epoch 5, batch 5241
training loss: 0.08138687908649445 

Epoch 5, batch 5242
training loss: 0.2556750178337097 

Epoch 5, batch 5243
training loss:

Epoch 5, batch 5445
training loss: 0.30548813939094543 

Epoch 5, batch 5446
training loss: 0.020977091044187546 

Epoch 5, batch 5447
training loss: 0.3038601577281952 

Epoch 5, batch 5448
training loss: 0.012026091106235981 

Epoch 5, batch 5449
training loss: 0.2708483040332794 

Epoch 5, batch 5450
training loss: 0.16005408763885498 

Epoch 5, batch 5451
training loss: 0.038610100746154785 

Epoch 5, batch 5452
training loss: 0.05902710556983948 

Epoch 5, batch 5453
training loss: 0.025083819404244423 

Epoch 5, batch 5454
training loss: 0.0650111511349678 

Epoch 5, batch 5455
training loss: 0.03695949167013168 

Epoch 5, batch 5456
training loss: 0.3548465073108673 

Epoch 5, batch 5457
training loss: 0.010859673842787743 

Epoch 5, batch 5458
training loss: 1.1569859981536865 

Epoch 5, batch 5459
training loss: 0.22851784527301788 

Epoch 5, batch 5460
training loss: 0.6859562993049622 

Epoch 5, batch 5461
training loss: 0.05459842085838318 

Epoch 5, batch 5462
training los

Epoch 5, batch 5668
training loss: 0.3938208818435669 

Epoch 5, batch 5669
training loss: 0.01207028143107891 

Epoch 5, batch 5670
training loss: 0.12484214454889297 

Epoch 5, batch 5671
training loss: 0.03932136669754982 

Epoch 5, batch 5672
training loss: 0.7156623005867004 

Epoch 5, batch 5673
training loss: 0.06882323324680328 

Epoch 5, batch 5674
training loss: 0.20779886841773987 

Epoch 5, batch 5675
training loss: 0.05387512594461441 

Epoch 5, batch 5676
training loss: 0.13474991917610168 

Epoch 5, batch 5677
training loss: 0.06522461026906967 

Epoch 5, batch 5678
training loss: 0.041758060455322266 

Epoch 5, batch 5679
training loss: 0.8629763722419739 

Epoch 5, batch 5680
training loss: 0.01887528784573078 

Epoch 5, batch 5681
training loss: 1.5240516662597656 

Epoch 5, batch 5682
training loss: 0.012879406102001667 

Epoch 5, batch 5683
training loss: 0.620449423789978 

Epoch 5, batch 5684
training loss: 0.00848173163831234 

Epoch 5, batch 5685
training loss: 

Epoch 5, batch 5890
training loss: 0.012056751176714897 

Epoch 5, batch 5891
training loss: 0.009670144878327847 

Epoch 5, batch 5892
training loss: 0.029483595862984657 

Epoch 5, batch 5893
training loss: 0.010735617950558662 

Epoch 5, batch 5894
training loss: 0.010395909659564495 

Epoch 5, batch 5895
training loss: 0.016510898247361183 

Epoch 5, batch 5896
training loss: 0.014988606795668602 

Epoch 5, batch 5897
training loss: 0.1271451860666275 

Epoch 5, batch 5898
training loss: 0.014693701639771461 

Epoch 5, batch 5899
training loss: 0.01691470853984356 

Epoch 5, batch 5900
training loss: 0.0564761683344841 

Epoch 5, batch 5901
training loss: 0.1600542664527893 

Epoch 5, batch 5902
training loss: 0.15066207945346832 

Epoch 5, batch 5903
training loss: 0.06139390543103218 

Epoch 5, batch 5904
training loss: 0.005131646990776062 

Epoch 5, batch 5905
training loss: 0.09184269607067108 

Epoch 5, batch 5906
training loss: 0.024580471217632294 

Epoch 5, batch 5907
trai

Epoch 6, batch 109
training loss: 0.29387184977531433 

Epoch 6, batch 110
training loss: 0.09167157113552094 

Epoch 6, batch 111
training loss: 0.3185635805130005 

Epoch 6, batch 112
training loss: 0.13092607259750366 

Epoch 6, batch 113
training loss: 0.12374137341976166 

Epoch 6, batch 114
training loss: 0.040350981056690216 

Epoch 6, batch 115
training loss: 0.16021069884300232 

Epoch 6, batch 116
training loss: 0.021980779245495796 

Epoch 6, batch 117
training loss: 0.1691727340221405 

Epoch 6, batch 118
training loss: 0.0863930955529213 

Epoch 6, batch 119
training loss: 0.021147433668375015 

Epoch 6, batch 120
training loss: 0.6206444501876831 

Epoch 6, batch 121
training loss: 0.022656705230474472 

Epoch 6, batch 122
training loss: 0.5668680667877197 

Epoch 6, batch 123
training loss: 0.0269392728805542 

Epoch 6, batch 124
training loss: 0.011469380930066109 

Epoch 6, batch 125
training loss: 0.03237040713429451 

Epoch 6, batch 126
training loss: 0.0312203355133

Epoch 6, batch 330
training loss: 0.020615164190530777 

Epoch 6, batch 331
training loss: 0.03549572080373764 

Epoch 6, batch 332
training loss: 0.4718770980834961 

Epoch 6, batch 333
training loss: 0.09667032212018967 

Epoch 6, batch 334
training loss: 0.3652884364128113 

Epoch 6, batch 335
training loss: 0.0876077339053154 

Epoch 6, batch 336
training loss: 0.15210266411304474 

Epoch 6, batch 337
training loss: 0.302250474691391 

Epoch 6, batch 338
training loss: 0.004429810680449009 

Epoch 6, batch 339
training loss: 0.023665282875299454 

Epoch 6, batch 340
training loss: 0.0635259822010994 

Epoch 6, batch 341
training loss: 0.0135792912915349 

Epoch 6, batch 342
training loss: 0.03460449352860451 

Epoch 6, batch 343
training loss: 0.1968904286623001 

Epoch 6, batch 344
training loss: 0.04960178956389427 

Epoch 6, batch 345
training loss: 0.07430307567119598 

Epoch 6, batch 346
training loss: 0.05146074295043945 

Epoch 6, batch 347
training loss: 0.11445393413305283

Epoch 6, batch 547
training loss: 0.046552516520023346 

Epoch 6, batch 548
training loss: 0.00900998804718256 

Epoch 6, batch 549
training loss: 0.01629028096795082 

Epoch 6, batch 550
training loss: 0.002941233105957508 

Epoch 6, batch 551
training loss: 0.027292797341942787 

Epoch 6, batch 552
training loss: 0.05907706171274185 

Epoch 6, batch 553
training loss: 0.03503567725419998 

Epoch 6, batch 554
training loss: 0.06892137229442596 

Epoch 6, batch 555
training loss: 0.05535149574279785 

Epoch 6, batch 556
training loss: 0.02173733524978161 

Epoch 6, batch 557
training loss: 0.0343351736664772 

Epoch 6, batch 558
training loss: 0.368586003780365 

Epoch 6, batch 559
training loss: 0.2224060595035553 

Epoch 6, batch 560
training loss: 0.10584646463394165 

Epoch 6, batch 561
training loss: 0.06872420012950897 

Epoch 6, batch 562
training loss: 0.4759292006492615 

Epoch 6, batch 563
training loss: 0.03165536746382713 

Epoch 6, batch 564
training loss: 0.05693913623690

Epoch 6, batch 768
training loss: 0.037769101560115814 

Epoch 6, batch 769
training loss: 0.012144247069954872 

Epoch 6, batch 770
training loss: 0.42757076025009155 

Epoch 6, batch 771
training loss: 0.014332440681755543 

Epoch 6, batch 772
training loss: 0.04292488843202591 

Epoch 6, batch 773
training loss: 0.030503273010253906 

Epoch 6, batch 774
training loss: 0.024332696571946144 

Epoch 6, batch 775
training loss: 0.00970827043056488 

Epoch 6, batch 776
training loss: 0.15567083656787872 

Epoch 6, batch 777
training loss: 0.09687403589487076 

Epoch 6, batch 778
training loss: 0.033548906445503235 

Epoch 6, batch 779
training loss: 0.871832013130188 

Epoch 6, batch 780
training loss: 0.12636443972587585 

Epoch 6, batch 781
training loss: 0.613176703453064 

Epoch 6, batch 782
training loss: 0.29453790187835693 

Epoch 6, batch 783
training loss: 0.03253820911049843 

Epoch 6, batch 784
training loss: 0.16990071535110474 

Epoch 6, batch 785
training loss: 0.0051118442

Epoch 6, batch 987
training loss: 0.17270156741142273 

Epoch 6, batch 988
training loss: 0.4607066512107849 

Epoch 6, batch 989
training loss: 0.2120814323425293 

Epoch 6, batch 990
training loss: 0.08255492895841599 

Epoch 6, batch 991
training loss: 0.1498342603445053 

Epoch 6, batch 992
training loss: 0.19054025411605835 

Epoch 6, batch 993
training loss: 0.12040361016988754 

Epoch 6, batch 994
training loss: 0.009514972567558289 

Epoch 6, batch 995
training loss: 0.009810645133256912 

Epoch 6, batch 996
training loss: 0.045122504234313965 

Epoch 6, batch 997
training loss: 0.12027864158153534 

Epoch 6, batch 998
training loss: 0.059725888073444366 

Epoch 6, batch 999
training loss: 0.5125705003738403 

Epoch 6, batch 1000
training loss: 0.03605762496590614 

Epoch 6, batch 1001
training loss: 0.1060517430305481 

Epoch 6, batch 1002
training loss: 0.015144874341785908 

Epoch 6, batch 1003
training loss: 0.027699554339051247 

Epoch 6, batch 1004
training loss: 0.082242

Epoch 6, batch 1205
training loss: 0.021755561232566833 

Epoch 6, batch 1206
training loss: 0.1728099286556244 

Epoch 6, batch 1207
training loss: 0.3386954069137573 

Epoch 6, batch 1208
training loss: 0.010619422420859337 

Epoch 6, batch 1209
training loss: 0.14378438889980316 

Epoch 6, batch 1210
training loss: 0.12544533610343933 

Epoch 6, batch 1211
training loss: 0.15141889452934265 

Epoch 6, batch 1212
training loss: 0.06184645742177963 

Epoch 6, batch 1213
training loss: 0.1026122197508812 

Epoch 6, batch 1214
training loss: 0.022319454699754715 

Epoch 6, batch 1215
training loss: 0.1202348843216896 

Epoch 6, batch 1216
training loss: 0.054419539868831635 

Epoch 6, batch 1217
training loss: 0.05355595424771309 

Epoch 6, batch 1218
training loss: 0.018637970089912415 

Epoch 6, batch 1219
training loss: 0.08907674252986908 

Epoch 6, batch 1220
training loss: 0.41474834084510803 

Epoch 6, batch 1221
training loss: 0.23135781288146973 

Epoch 6, batch 1222
training l

Epoch 6, batch 1425
training loss: 0.04228905215859413 

Epoch 6, batch 1426
training loss: 0.052896179258823395 

Epoch 6, batch 1427
training loss: 0.02770158275961876 

Epoch 6, batch 1428
training loss: 0.011573169380426407 

Epoch 6, batch 1429
training loss: 0.07777970284223557 

Epoch 6, batch 1430
training loss: 0.08033303171396255 

Epoch 6, batch 1431
training loss: 0.3004593849182129 

Epoch 6, batch 1432
training loss: 0.037940703332424164 

Epoch 6, batch 1433
training loss: 0.003845586208626628 

Epoch 6, batch 1434
training loss: 0.03617890924215317 

Epoch 6, batch 1435
training loss: 0.11847887188196182 

Epoch 6, batch 1436
training loss: 0.04868283122777939 

Epoch 6, batch 1437
training loss: 0.08268607407808304 

Epoch 6, batch 1438
training loss: 0.49157485365867615 

Epoch 6, batch 1439
training loss: 0.19802285730838776 

Epoch 6, batch 1440
training loss: 0.03203238919377327 

Epoch 6, batch 1441
training loss: 0.050607841461896896 

Epoch 6, batch 1442
trainin

Epoch 6, batch 1649
training loss: 0.06887492537498474 

Epoch 6, batch 1650
training loss: 0.0679866224527359 

Epoch 6, batch 1651
training loss: 0.06956150382757187 

Epoch 6, batch 1652
training loss: 0.012326959520578384 

Epoch 6, batch 1653
training loss: 0.23757889866828918 

Epoch 6, batch 1654
training loss: 0.02647264301776886 

Epoch 6, batch 1655
training loss: 0.027718234807252884 

Epoch 6, batch 1656
training loss: 0.08290837705135345 

Epoch 6, batch 1657
training loss: 0.009966491721570492 

Epoch 6, batch 1658
training loss: 0.03180483728647232 

Epoch 6, batch 1659
training loss: 0.6276532411575317 

Epoch 6, batch 1660
training loss: 0.031690195202827454 

Epoch 6, batch 1661
training loss: 0.007790878415107727 

Epoch 6, batch 1662
training loss: 0.14127382636070251 

Epoch 6, batch 1663
training loss: 0.006371228955686092 

Epoch 6, batch 1664
training loss: 0.18860042095184326 

Epoch 6, batch 1665
training loss: 0.012805169448256493 

Epoch 6, batch 1666
traini

Epoch 6, batch 1866
training loss: 0.3957396149635315 

Epoch 6, batch 1867
training loss: 0.025332432240247726 

Epoch 6, batch 1868
training loss: 0.7619918584823608 

Epoch 6, batch 1869
training loss: 0.011333843693137169 

Epoch 6, batch 1870
training loss: 0.013261775486171246 

Epoch 6, batch 1871
training loss: 0.02706281840801239 

Epoch 6, batch 1872
training loss: 0.013673365116119385 

Epoch 6, batch 1873
training loss: 0.09096065908670425 

Epoch 6, batch 1874
training loss: 0.16415484249591827 

Epoch 6, batch 1875
training loss: 0.015083283185958862 

Epoch 6, batch 1876
training loss: 0.6762207746505737 

Epoch 6, batch 1877
training loss: 0.22337813675403595 

Epoch 6, batch 1878
training loss: 0.034557536244392395 

Epoch 6, batch 1879
training loss: 0.48388949036598206 

Epoch 6, batch 1880
training loss: 0.11595200002193451 

Epoch 6, batch 1881
training loss: 0.23554980754852295 

Epoch 6, batch 1882
training loss: 0.09064976871013641 

Epoch 6, batch 1883
training

Epoch 6, batch 2083
training loss: 0.02856464684009552 

Epoch 6, batch 2084
training loss: 0.10227525234222412 

Epoch 6, batch 2085
training loss: 0.0807921439409256 

Epoch 6, batch 2086
training loss: 0.06326920539140701 

Epoch 6, batch 2087
training loss: 0.016258955001831055 

Epoch 6, batch 2088
training loss: 0.04154789075255394 

Epoch 6, batch 2089
training loss: 0.13651692867279053 

Epoch 6, batch 2090
training loss: 0.26117512583732605 

Epoch 6, batch 2091
training loss: 0.07034843415021896 

Epoch 6, batch 2092
training loss: 0.1270819753408432 

Epoch 6, batch 2093
training loss: 0.04478378966450691 

Epoch 6, batch 2094
training loss: 0.18189315497875214 

Epoch 6, batch 2095
training loss: 0.05676160007715225 

Epoch 6, batch 2096
training loss: 0.08667068183422089 

Epoch 6, batch 2097
training loss: 0.34016287326812744 

Epoch 6, batch 2098
training loss: 0.07350875437259674 

Epoch 6, batch 2099
training loss: 0.005824160762131214 

Epoch 6, batch 2100
training lo

Epoch 6, batch 2297
training loss: 0.21196675300598145 

Epoch 6, batch 2298
training loss: 0.676864504814148 

Epoch 6, batch 2299
training loss: 0.06186367943882942 

Epoch 6, batch 2300
training loss: 0.17507842183113098 

Epoch 6, batch 2301
training loss: 0.24989712238311768 

Epoch 6, batch 2302
training loss: 0.0154707757756114 

Epoch 6, batch 2303
training loss: 0.06089390441775322 

Epoch 6, batch 2304
training loss: 0.061186064034700394 

Epoch 6, batch 2305
training loss: 0.0028365743346512318 

Epoch 6, batch 2306
training loss: 0.1463669240474701 

Epoch 6, batch 2307
training loss: 0.012075248174369335 

Epoch 6, batch 2308
training loss: 0.015116390772163868 

Epoch 6, batch 2309
training loss: 0.17356857657432556 

Epoch 6, batch 2310
training loss: 0.3784298300743103 

Epoch 6, batch 2311
training loss: 0.03533145785331726 

Epoch 6, batch 2312
training loss: 0.04739641398191452 

Epoch 6, batch 2313
training loss: 0.3025163412094116 

Epoch 6, batch 2314
training los

Epoch 6, batch 2513
training loss: 0.03584297373890877 

Epoch 6, batch 2514
training loss: 0.02805803343653679 

Epoch 6, batch 2515
training loss: 0.007897084578871727 

Epoch 6, batch 2516
training loss: 0.37136706709861755 

Epoch 6, batch 2517
training loss: 0.014996220357716084 

Epoch 6, batch 2518
training loss: 0.06291688978672028 

Epoch 6, batch 2519
training loss: 0.018536347895860672 

Epoch 6, batch 2520
training loss: 0.18743164837360382 

Epoch 6, batch 2521
training loss: 0.09459316730499268 

Epoch 6, batch 2522
training loss: 0.26110512018203735 

Epoch 6, batch 2523
training loss: 0.1804153025150299 

Epoch 6, batch 2524
training loss: 0.2536354959011078 

Epoch 6, batch 2525
training loss: 0.01021246425807476 

Epoch 6, batch 2526
training loss: 0.1218121200799942 

Epoch 6, batch 2527
training loss: 0.02126297913491726 

Epoch 6, batch 2528
training loss: 0.03258557617664337 

Epoch 6, batch 2529
training loss: 0.04936946928501129 

Epoch 6, batch 2530
training lo

Epoch 6, batch 2722
training loss: 0.27530044317245483 

Epoch 6, batch 2723
training loss: 0.04221590608358383 

Epoch 6, batch 2724
training loss: 0.05634162947535515 

Epoch 6, batch 2725
training loss: 0.579332709312439 

Epoch 6, batch 2726
training loss: 0.052494388073682785 

Epoch 6, batch 2727
training loss: 0.011802265420556068 

Epoch 6, batch 2728
training loss: 0.17138619720935822 

Epoch 6, batch 2729
training loss: 0.04254594445228577 

Epoch 6, batch 2730
training loss: 0.15915434062480927 

Epoch 6, batch 2731
training loss: 0.1722445785999298 

Epoch 6, batch 2732
training loss: 0.05321105569601059 

Epoch 6, batch 2733
training loss: 0.09463454782962799 

Epoch 6, batch 2734
training loss: 0.11204211413860321 

Epoch 6, batch 2735
training loss: 0.053902767598629 

Epoch 6, batch 2736
training loss: 0.06046166270971298 

Epoch 6, batch 2737
training loss: 0.005256029777228832 

Epoch 6, batch 2738
training loss: 0.010573040693998337 

Epoch 6, batch 2739
training los

Epoch 6, batch 2944
training loss: 0.20326490700244904 

Epoch 6, batch 2945
training loss: 0.5481757521629333 

Epoch 6, batch 2946
training loss: 0.017484556883573532 

Epoch 6, batch 2947
training loss: 0.5441280603408813 

Epoch 6, batch 2948
training loss: 0.8848645091056824 

Epoch 6, batch 2949
training loss: 0.0507412925362587 

Epoch 6, batch 2950
training loss: 0.04499150812625885 

Epoch 6, batch 2951
training loss: 0.020841384306550026 

Epoch 6, batch 2952
training loss: 0.0586002878844738 

Epoch 6, batch 2953
training loss: 0.236077219247818 

Epoch 6, batch 2954
training loss: 0.0855027511715889 

Epoch 6, batch 2955
training loss: 0.19747552275657654 

Epoch 6, batch 2956
training loss: 0.1141791120171547 

Epoch 6, batch 2957
training loss: 0.04882722720503807 

Epoch 6, batch 2958
training loss: 0.042131125926971436 

Epoch 6, batch 2959
training loss: 0.16538959741592407 

Epoch 6, batch 2960
training loss: 0.020892690867185593 

Epoch 6, batch 2961
training loss: 0

Epoch 6, batch 3164
training loss: 0.6365982294082642 

Epoch 6, batch 3165
training loss: 0.34560075402259827 

Epoch 6, batch 3166
training loss: 0.06955759227275848 

Epoch 6, batch 3167
training loss: 0.6567205190658569 

Epoch 6, batch 3168
training loss: 0.024195250123739243 

Epoch 6, batch 3169
training loss: 0.1653967797756195 

Epoch 6, batch 3170
training loss: 0.008708130568265915 

Epoch 6, batch 3171
training loss: 0.0304401908069849 

Epoch 6, batch 3172
training loss: 0.18680237233638763 

Epoch 6, batch 3173
training loss: 0.1062372550368309 

Epoch 6, batch 3174
training loss: 0.004092202056199312 

Epoch 6, batch 3175
training loss: 0.0964808240532875 

Epoch 6, batch 3176
training loss: 0.2771014869213104 

Epoch 6, batch 3177
training loss: 0.25708383321762085 

Epoch 6, batch 3178
training loss: 0.0045746988616883755 

Epoch 6, batch 3179
training loss: 0.3187485933303833 

Epoch 6, batch 3180
training loss: 0.22478167712688446 

Epoch 6, batch 3181
training loss:

Epoch 6, batch 3384
training loss: 0.17290574312210083 

Epoch 6, batch 3385
training loss: 0.04479213058948517 

Epoch 6, batch 3386
training loss: 0.1366168111562729 

Epoch 6, batch 3387
training loss: 0.4862540662288666 

Epoch 6, batch 3388
training loss: 0.06139938905835152 

Epoch 6, batch 3389
training loss: 0.08688588440418243 

Epoch 6, batch 3390
training loss: 0.0517750009894371 

Epoch 6, batch 3391
training loss: 0.08523281663656235 

Epoch 6, batch 3392
training loss: 0.5078178644180298 

Epoch 6, batch 3393
training loss: 0.06766451895236969 

Epoch 6, batch 3394
training loss: 0.3859887719154358 

Epoch 6, batch 3395
training loss: 0.018845435231924057 

Epoch 6, batch 3396
training loss: 0.2608388662338257 

Epoch 6, batch 3397
training loss: 0.4809928834438324 

Epoch 6, batch 3398
training loss: 0.014136970043182373 

Epoch 6, batch 3399
training loss: 0.8335233926773071 

Epoch 6, batch 3400
training loss: 0.033382803201675415 

Epoch 6, batch 3401
training loss: 0

Epoch 6, batch 3604
training loss: 0.18350261449813843 

Epoch 6, batch 3605
training loss: 0.15547466278076172 

Epoch 6, batch 3606
training loss: 0.2771216034889221 

Epoch 6, batch 3607
training loss: 0.02893821895122528 

Epoch 6, batch 3608
training loss: 0.03697144240140915 

Epoch 6, batch 3609
training loss: 0.03503953665494919 

Epoch 6, batch 3610
training loss: 0.08789734542369843 

Epoch 6, batch 3611
training loss: 0.01704219914972782 

Epoch 6, batch 3612
training loss: 0.012852141633629799 

Epoch 6, batch 3613
training loss: 0.6360002160072327 

Epoch 6, batch 3614
training loss: 0.014919492416083813 

Epoch 6, batch 3615
training loss: 0.016425682231783867 

Epoch 6, batch 3616
training loss: 0.015759458765387535 

Epoch 6, batch 3617
training loss: 0.09856986254453659 

Epoch 6, batch 3618
training loss: 0.6018375158309937 

Epoch 6, batch 3619
training loss: 0.24401693046092987 

Epoch 6, batch 3620
training loss: 0.009625822305679321 

Epoch 6, batch 3621
training 

Epoch 6, batch 3823
training loss: 0.5446348190307617 

Epoch 6, batch 3824
training loss: 0.023766513913869858 

Epoch 6, batch 3825
training loss: 0.0299219973385334 

Epoch 6, batch 3826
training loss: 0.24279026687145233 

Epoch 6, batch 3827
training loss: 0.010854611173272133 

Epoch 6, batch 3828
training loss: 0.06889382004737854 

Epoch 6, batch 3829
training loss: 0.009856665506958961 

Epoch 6, batch 3830
training loss: 0.007008219603449106 

Epoch 6, batch 3831
training loss: 0.0967564806342125 

Epoch 6, batch 3832
training loss: 0.025731533765792847 

Epoch 6, batch 3833
training loss: 0.06937585771083832 

Epoch 6, batch 3834
training loss: 0.414407879114151 

Epoch 6, batch 3835
training loss: 0.14246538281440735 

Epoch 6, batch 3836
training loss: 0.07064595818519592 

Epoch 6, batch 3837
training loss: 0.010645316913723946 

Epoch 6, batch 3838
training loss: 0.22450192272663116 

Epoch 6, batch 3839
training loss: 0.18847309052944183 

Epoch 6, batch 3840
training l

Epoch 6, batch 4036
training loss: 0.01970786787569523 

Epoch 6, batch 4037
training loss: 0.4607236981391907 

Epoch 6, batch 4038
training loss: 0.01479010283946991 

Epoch 6, batch 4039
training loss: 0.11750243604183197 

Epoch 6, batch 4040
training loss: 0.0033874809741973877 

Epoch 6, batch 4041
training loss: 0.0070544034242630005 

Epoch 6, batch 4042
training loss: 0.16818033158779144 

Epoch 6, batch 4043
training loss: 0.07914082705974579 

Epoch 6, batch 4044
training loss: 0.021183665841817856 

Epoch 6, batch 4045
training loss: 0.07094547897577286 

Epoch 6, batch 4046
training loss: 0.027542149648070335 

Epoch 6, batch 4047
training loss: 0.09884142875671387 

Epoch 6, batch 4048
training loss: 0.04728925973176956 

Epoch 6, batch 4049
training loss: 0.09784682840108871 

Epoch 6, batch 4050
training loss: 0.15812917053699493 

Epoch 6, batch 4051
training loss: 0.007938372902572155 

Epoch 6, batch 4052
training loss: 0.011744027957320213 

Epoch 6, batch 4053
trai

Epoch 6, batch 4256
training loss: 0.005970795638859272 

Epoch 6, batch 4257
training loss: 0.008336128666996956 

Epoch 6, batch 4258
training loss: 0.17548182606697083 

Epoch 6, batch 4259
training loss: 0.05262797325849533 

Epoch 6, batch 4260
training loss: 0.00480690598487854 

Epoch 6, batch 4261
training loss: 0.04061666876077652 

Epoch 6, batch 4262
training loss: 0.5744118690490723 

Epoch 6, batch 4263
training loss: 0.05949405953288078 

Epoch 6, batch 4264
training loss: 0.007618204690515995 

Epoch 6, batch 4265
training loss: 0.060684554278850555 

Epoch 6, batch 4266
training loss: 0.26464366912841797 

Epoch 6, batch 4267
training loss: 0.03335829824209213 

Epoch 6, batch 4268
training loss: 0.016696538776159286 

Epoch 6, batch 4269
training loss: 0.008136797696352005 

Epoch 6, batch 4270
training loss: 0.027559224516153336 

Epoch 6, batch 4271
training loss: 0.004769906867295504 

Epoch 6, batch 4272
training loss: 0.09889505058526993 

Epoch 6, batch 4273
trai

Epoch 6, batch 4477
training loss: 0.5109545588493347 

Epoch 6, batch 4478
training loss: 0.8804062008857727 

Epoch 6, batch 4479
training loss: 0.0764087662100792 

Epoch 6, batch 4480
training loss: 0.9332072138786316 

Epoch 6, batch 4481
training loss: 0.26072314381599426 

Epoch 6, batch 4482
training loss: 0.05347081273794174 

Epoch 6, batch 4483
training loss: 0.6521614789962769 

Epoch 6, batch 4484
training loss: 0.10794459283351898 

Epoch 6, batch 4485
training loss: 0.14606711268424988 

Epoch 6, batch 4486
training loss: 0.011094172485172749 

Epoch 6, batch 4487
training loss: 0.1553838700056076 

Epoch 6, batch 4488
training loss: 0.09027223289012909 

Epoch 6, batch 4489
training loss: 0.3054105043411255 

Epoch 6, batch 4490
training loss: 0.1475510150194168 

Epoch 6, batch 4491
training loss: 0.13643807172775269 

Epoch 6, batch 4492
training loss: 0.13187991082668304 

Epoch 6, batch 4493
training loss: 0.014863322488963604 

Epoch 6, batch 4494
training loss: 0.

Epoch 6, batch 4699
training loss: 0.007840270176529884 

Epoch 6, batch 4700
training loss: 0.6419882774353027 

Epoch 6, batch 4701
training loss: 0.0065125832334160805 

Epoch 6, batch 4702
training loss: 0.07775290310382843 

Epoch 6, batch 4703
training loss: 0.32692158222198486 

Epoch 6, batch 4704
training loss: 0.18339543044567108 

Epoch 6, batch 4705
training loss: 0.028483275324106216 

Epoch 6, batch 4706
training loss: 0.05245272442698479 

Epoch 6, batch 4707
training loss: 0.35696834325790405 

Epoch 6, batch 4708
training loss: 0.06571914255619049 

Epoch 6, batch 4709
training loss: 0.012770222499966621 

Epoch 6, batch 4710
training loss: 0.00996056105941534 

Epoch 6, batch 4711
training loss: 0.011559381149709225 

Epoch 6, batch 4712
training loss: 0.023200972005724907 

Epoch 6, batch 4713
training loss: 0.07007412612438202 

Epoch 6, batch 4714
training loss: 0.04757460206747055 

Epoch 6, batch 4715
training loss: 0.35191553831100464 

Epoch 6, batch 4716
train

Epoch 6, batch 4920
training loss: 0.050462137907743454 

Epoch 6, batch 4921
training loss: 0.07448957115411758 

Epoch 6, batch 4922
training loss: 0.1513374298810959 

Epoch 6, batch 4923
training loss: 0.02907312475144863 

Epoch 6, batch 4924
training loss: 0.01338349748402834 

Epoch 6, batch 4925
training loss: 0.014417899772524834 

Epoch 6, batch 4926
training loss: 0.04603176191449165 

Epoch 6, batch 4927
training loss: 0.07587099820375443 

Epoch 6, batch 4928
training loss: 0.46616607904434204 

Epoch 6, batch 4929
training loss: 0.12366907298564911 

Epoch 6, batch 4930
training loss: 0.01216041762381792 

Epoch 6, batch 4931
training loss: 0.051605772227048874 

Epoch 6, batch 4932
training loss: 0.0036093308590352535 

Epoch 6, batch 4933
training loss: 0.2775319218635559 

Epoch 6, batch 4934
training loss: 0.02635597065091133 

Epoch 6, batch 4935
training loss: 0.1609567105770111 

Epoch 6, batch 4936
training loss: 0.022691454738378525 

Epoch 6, batch 4937
training

Epoch 6, batch 5140
training loss: 0.020622702315449715 

Epoch 6, batch 5141
training loss: 0.3909105360507965 

Epoch 6, batch 5142
training loss: 0.14758968353271484 

Epoch 6, batch 5143
training loss: 0.17176316678524017 

Epoch 6, batch 5144
training loss: 0.3108353018760681 

Epoch 6, batch 5145
training loss: 0.024051493033766747 

Epoch 6, batch 5146
training loss: 0.10771676152944565 

Epoch 6, batch 5147
training loss: 0.016446705907583237 

Epoch 6, batch 5148
training loss: 0.06585099548101425 

Epoch 6, batch 5149
training loss: 0.022191891446709633 

Epoch 6, batch 5150
training loss: 0.14529570937156677 

Epoch 6, batch 5151
training loss: 0.06187571957707405 

Epoch 6, batch 5152
training loss: 0.0877033993601799 

Epoch 6, batch 5153
training loss: 0.153508260846138 

Epoch 6, batch 5154
training loss: 0.014362214133143425 

Epoch 6, batch 5155
training loss: 0.023794416338205338 

Epoch 6, batch 5156
training loss: 0.01301572471857071 

Epoch 6, batch 5157
training l

Epoch 6, batch 5359
training loss: 0.02011043392121792 

Epoch 6, batch 5360
training loss: 1.0060961246490479 

Epoch 6, batch 5361
training loss: 0.01945704035460949 

Epoch 6, batch 5362
training loss: 0.11175328493118286 

Epoch 6, batch 5363
training loss: 0.04512636363506317 

Epoch 6, batch 5364
training loss: 0.39823490381240845 

Epoch 6, batch 5365
training loss: 0.1140194907784462 

Epoch 6, batch 5366
training loss: 0.056621003895998 

Epoch 6, batch 5367
training loss: 0.052090954035520554 

Epoch 6, batch 5368
training loss: 0.0619368851184845 

Epoch 6, batch 5369
training loss: 0.17928233742713928 

Epoch 6, batch 5370
training loss: 0.048296909779310226 

Epoch 6, batch 5371
training loss: 0.5033212900161743 

Epoch 6, batch 5372
training loss: 0.012716243974864483 

Epoch 6, batch 5373
training loss: 0.01906477101147175 

Epoch 6, batch 5374
training loss: 0.013143179938197136 

Epoch 6, batch 5375
training loss: 0.11018171161413193 

Epoch 6, batch 5376
training loss

Epoch 6, batch 5582
training loss: 0.16646209359169006 

Epoch 6, batch 5583
training loss: 0.2873074412345886 

Epoch 6, batch 5584
training loss: 0.018437039107084274 

Epoch 6, batch 5585
training loss: 0.4242919385433197 

Epoch 6, batch 5586
training loss: 0.4574071764945984 

Epoch 6, batch 5587
training loss: 0.06941168010234833 

Epoch 6, batch 5588
training loss: 0.6635669469833374 

Epoch 6, batch 5589
training loss: 0.3030232787132263 

Epoch 6, batch 5590
training loss: 0.13153807818889618 

Epoch 6, batch 5591
training loss: 0.11358390748500824 

Epoch 6, batch 5592
training loss: 0.016183745115995407 

Epoch 6, batch 5593
training loss: 0.05959028750658035 

Epoch 6, batch 5594
training loss: 0.012523015029728413 

Epoch 6, batch 5595
training loss: 0.16420519351959229 

Epoch 6, batch 5596
training loss: 0.39361315965652466 

Epoch 6, batch 5597
training loss: 0.011642220430076122 

Epoch 6, batch 5598
training loss: 0.00957916583865881 

Epoch 6, batch 5599
training los

Epoch 6, batch 5803
training loss: 0.1222764253616333 

Epoch 6, batch 5804
training loss: 0.018329689279198647 

Epoch 6, batch 5805
training loss: 0.020293299108743668 

Epoch 6, batch 5806
training loss: 0.11380697786808014 

Epoch 6, batch 5807
training loss: 0.03940592706203461 

Epoch 6, batch 5808
training loss: 0.008736291900277138 

Epoch 6, batch 5809
training loss: 0.04044336825609207 

Epoch 6, batch 5810
training loss: 0.2126840353012085 

Epoch 6, batch 5811
training loss: 0.07323616743087769 

Epoch 6, batch 5812
training loss: 0.03374878317117691 

Epoch 6, batch 5813
training loss: 0.054828107357025146 

Epoch 6, batch 5814
training loss: 0.031069327145814896 

Epoch 6, batch 5815
training loss: 0.10681084543466568 

Epoch 6, batch 5816
training loss: 0.18459385633468628 

Epoch 6, batch 5817
training loss: 0.014159160666167736 

Epoch 6, batch 5818
training loss: 0.055952370166778564 

Epoch 6, batch 5819
training loss: 0.020606862381100655 

Epoch 6, batch 5820
train

Epoch 7, batch 18
training loss: 0.0041333409026265144 

Epoch 7, batch 19
training loss: 0.013128031976521015 

Epoch 7, batch 20
training loss: 0.10909418761730194 

Epoch 7, batch 21
training loss: 0.06699161231517792 

Epoch 7, batch 22
training loss: 0.08567242324352264 

Epoch 7, batch 23
training loss: 0.10306942462921143 

Epoch 7, batch 24
training loss: 0.09677119553089142 

Epoch 7, batch 25
training loss: 0.03680342808365822 

Epoch 7, batch 26
training loss: 0.026706645265221596 

Epoch 7, batch 27
training loss: 0.041751883924007416 

Epoch 7, batch 28
training loss: 0.01887291669845581 

Epoch 7, batch 29
training loss: 0.0958172082901001 

Epoch 7, batch 30
training loss: 0.02892959490418434 

Epoch 7, batch 31
training loss: 0.03418195992708206 

Epoch 7, batch 32
training loss: 0.010014794766902924 

Epoch 7, batch 33
training loss: 0.011529393494129181 

Epoch 7, batch 34
training loss: 0.04278535395860672 

Epoch 7, batch 35
training loss: 0.10449154675006866 

Epoc

Epoch 7, batch 234
training loss: 0.06295420229434967 

Epoch 7, batch 235
training loss: 0.7232552766799927 

Epoch 7, batch 236
training loss: 0.13486947119235992 

Epoch 7, batch 237
training loss: 0.030621016398072243 

Epoch 7, batch 238
training loss: 0.12618039548397064 

Epoch 7, batch 239
training loss: 0.01751450076699257 

Epoch 7, batch 240
training loss: 0.007914849556982517 

Epoch 7, batch 241
training loss: 0.02433074451982975 

Epoch 7, batch 242
training loss: 0.30873751640319824 

Epoch 7, batch 243
training loss: 0.1356199085712433 

Epoch 7, batch 244
training loss: 0.34273654222488403 

Epoch 7, batch 245
training loss: 0.0305666234344244 

Epoch 7, batch 246
training loss: 0.0848565623164177 

Epoch 7, batch 247
training loss: 0.07551757991313934 

Epoch 7, batch 248
training loss: 0.02387898601591587 

Epoch 7, batch 249
training loss: 0.08626386523246765 

Epoch 7, batch 250
training loss: 0.1242951899766922 

Epoch 7, batch 251
training loss: 0.108993008732795

Epoch 7, batch 456
training loss: 0.19319090247154236 

Epoch 7, batch 457
training loss: 0.01022682897746563 

Epoch 7, batch 458
training loss: 0.005107563454657793 

Epoch 7, batch 459
training loss: 0.6697551012039185 

Epoch 7, batch 460
training loss: 0.24153855443000793 

Epoch 7, batch 461
training loss: 0.1597367227077484 

Epoch 7, batch 462
training loss: 0.002384092193096876 

Epoch 7, batch 463
training loss: 0.008264882490038872 

Epoch 7, batch 464
training loss: 0.260112464427948 

Epoch 7, batch 465
training loss: 0.4836069643497467 

Epoch 7, batch 466
training loss: 0.03758718818426132 

Epoch 7, batch 467
training loss: 0.014500031247735023 

Epoch 7, batch 468
training loss: 0.0076385363936424255 

Epoch 7, batch 469
training loss: 0.144802063703537 

Epoch 7, batch 470
training loss: 0.029266661033034325 

Epoch 7, batch 471
training loss: 0.2764410376548767 

Epoch 7, batch 472
training loss: 0.09310992807149887 

Epoch 7, batch 473
training loss: 0.0138891693204

Epoch 7, batch 677
training loss: 0.005886164493858814 

Epoch 7, batch 678
training loss: 0.05169776827096939 

Epoch 7, batch 679
training loss: 0.11540912091732025 

Epoch 7, batch 680
training loss: 0.08952264487743378 

Epoch 7, batch 681
training loss: 0.5414397716522217 

Epoch 7, batch 682
training loss: 0.06896772980690002 

Epoch 7, batch 683
training loss: 0.01779261790215969 

Epoch 7, batch 684
training loss: 0.022941377013921738 

Epoch 7, batch 685
training loss: 0.1349492371082306 

Epoch 7, batch 686
training loss: 0.010414130985736847 

Epoch 7, batch 687
training loss: 0.015543155372142792 

Epoch 7, batch 688
training loss: 0.03792677819728851 

Epoch 7, batch 689
training loss: 0.07976243644952774 

Epoch 7, batch 690
training loss: 0.028194840997457504 

Epoch 7, batch 691
training loss: 0.041086845099925995 

Epoch 7, batch 692
training loss: 0.026783103123307228 

Epoch 7, batch 693
training loss: 0.04623613879084587 

Epoch 7, batch 694
training loss: 0.2141665

Epoch 7, batch 893
training loss: 0.020611826330423355 

Epoch 7, batch 894
training loss: 0.04726499319076538 

Epoch 7, batch 895
training loss: 0.0901820957660675 

Epoch 7, batch 896
training loss: 0.0023483135737478733 

Epoch 7, batch 897
training loss: 0.015322217717766762 

Epoch 7, batch 898
training loss: 0.01800462044775486 

Epoch 7, batch 899
training loss: 0.14903594553470612 

Epoch 7, batch 900
training loss: 0.011580203659832478 

Epoch 7, batch 901
training loss: 0.11314620822668076 

Epoch 7, batch 902
training loss: 0.00411731842905283 

Epoch 7, batch 903
training loss: 0.1191493421792984 

Epoch 7, batch 904
training loss: 0.00904014240950346 

Epoch 7, batch 905
training loss: 0.019002486020326614 

Epoch 7, batch 906
training loss: 0.8486034274101257 

Epoch 7, batch 907
training loss: 0.3326767385005951 

Epoch 7, batch 908
training loss: 0.012510046362876892 

Epoch 7, batch 909
training loss: 0.3210579752922058 

Epoch 7, batch 910
training loss: 0.2600102126

Epoch 7, batch 1110
training loss: 0.11290011554956436 

Epoch 7, batch 1111
training loss: 0.05063816159963608 

Epoch 7, batch 1112
training loss: 0.005262321792542934 

Epoch 7, batch 1113
training loss: 0.007262313272804022 

Epoch 7, batch 1114
training loss: 0.19845615327358246 

Epoch 7, batch 1115
training loss: 0.01377135794609785 

Epoch 7, batch 1116
training loss: 0.019910458475351334 

Epoch 7, batch 1117
training loss: 0.04697861894965172 

Epoch 7, batch 1118
training loss: 0.04992514103651047 

Epoch 7, batch 1119
training loss: 0.02951315976679325 

Epoch 7, batch 1120
training loss: 0.08259373158216476 

Epoch 7, batch 1121
training loss: 0.12063324451446533 

Epoch 7, batch 1122
training loss: 0.006238190922886133 

Epoch 7, batch 1123
training loss: 0.02289525792002678 

Epoch 7, batch 1124
training loss: 0.061701007187366486 

Epoch 7, batch 1125
training loss: 0.14817500114440918 

Epoch 7, batch 1126
training loss: 0.05671188235282898 

Epoch 7, batch 1127
traini

Epoch 7, batch 1327
training loss: 0.026898672804236412 

Epoch 7, batch 1328
training loss: 0.02635013498365879 

Epoch 7, batch 1329
training loss: 0.22594261169433594 

Epoch 7, batch 1330
training loss: 0.02267220802605152 

Epoch 7, batch 1331
training loss: 0.06243550032377243 

Epoch 7, batch 1332
training loss: 0.019345451146364212 

Epoch 7, batch 1333
training loss: 0.44256600737571716 

Epoch 7, batch 1334
training loss: 0.008020547218620777 

Epoch 7, batch 1335
training loss: 0.02032015658915043 

Epoch 7, batch 1336
training loss: 0.02710946463048458 

Epoch 7, batch 1337
training loss: 0.02144625596702099 

Epoch 7, batch 1338
training loss: 0.021159760653972626 

Epoch 7, batch 1339
training loss: 0.5382112860679626 

Epoch 7, batch 1340
training loss: 0.2690433859825134 

Epoch 7, batch 1341
training loss: 0.14689180254936218 

Epoch 7, batch 1342
training loss: 0.054088421165943146 

Epoch 7, batch 1343
training loss: 0.3609178960323334 

Epoch 7, batch 1344
training 

Epoch 7, batch 1546
training loss: 0.007824034430086613 

Epoch 7, batch 1547
training loss: 0.21967215836048126 

Epoch 7, batch 1548
training loss: 0.28860729932785034 

Epoch 7, batch 1549
training loss: 0.19555284082889557 

Epoch 7, batch 1550
training loss: 0.042804963886737823 

Epoch 7, batch 1551
training loss: 0.15473607182502747 

Epoch 7, batch 1552
training loss: 0.014403851702809334 

Epoch 7, batch 1553
training loss: 0.1908821165561676 

Epoch 7, batch 1554
training loss: 0.07360707223415375 

Epoch 7, batch 1555
training loss: 0.23893065750598907 

Epoch 7, batch 1556
training loss: 0.16728530824184418 

Epoch 7, batch 1557
training loss: 0.00710944551974535 

Epoch 7, batch 1558
training loss: 0.13654667139053345 

Epoch 7, batch 1559
training loss: 0.06175053119659424 

Epoch 7, batch 1560
training loss: 0.04333594813942909 

Epoch 7, batch 1561
training loss: 0.05614706873893738 

Epoch 7, batch 1562
training loss: 0.45535793900489807 

Epoch 7, batch 1563
training 

Epoch 7, batch 1765
training loss: 0.18747620284557343 

Epoch 7, batch 1766
training loss: 0.3377666175365448 

Epoch 7, batch 1767
training loss: 0.00888496171683073 

Epoch 7, batch 1768
training loss: 0.006794312037527561 

Epoch 7, batch 1769
training loss: 0.09490526467561722 

Epoch 7, batch 1770
training loss: 0.014140544459223747 

Epoch 7, batch 1771
training loss: 0.030520429834723473 

Epoch 7, batch 1772
training loss: 0.013651324436068535 

Epoch 7, batch 1773
training loss: 0.24287369847297668 

Epoch 7, batch 1774
training loss: 0.026813054457306862 

Epoch 7, batch 1775
training loss: 0.20047514140605927 

Epoch 7, batch 1776
training loss: 0.14294955134391785 

Epoch 7, batch 1777
training loss: 0.00455030333250761 

Epoch 7, batch 1778
training loss: 0.13364621996879578 

Epoch 7, batch 1779
training loss: 0.06124041602015495 

Epoch 7, batch 1780
training loss: 0.22982235252857208 

Epoch 7, batch 1781
training loss: 0.06207449361681938 

Epoch 7, batch 1782
trainin

Epoch 7, batch 1971
training loss: 0.005571651738137007 

Epoch 7, batch 1972
training loss: 0.018101820722222328 

Epoch 7, batch 1973
training loss: 0.03110601007938385 

Epoch 7, batch 1974
training loss: 0.016262734308838844 

Epoch 7, batch 1975
training loss: 0.04991019517183304 

Epoch 7, batch 1976
training loss: 0.020251402631402016 

Epoch 7, batch 1977
training loss: 0.6348077058792114 

Epoch 7, batch 1978
training loss: 0.026440853253006935 

Epoch 7, batch 1979
training loss: 0.3425895571708679 

Epoch 7, batch 1980
training loss: 0.055286236107349396 

Epoch 7, batch 1981
training loss: 0.02500702068209648 

Epoch 7, batch 1982
training loss: 0.32497185468673706 

Epoch 7, batch 1983
training loss: 0.017185237258672714 

Epoch 7, batch 1984
training loss: 0.025354836136102676 

Epoch 7, batch 1985
training loss: 0.06513528525829315 

Epoch 7, batch 1986
training loss: 0.029928911477327347 

Epoch 7, batch 1987
training loss: 0.0638575628399849 

Epoch 7, batch 1988
train

Epoch 7, batch 2189
training loss: 0.05913940817117691 

Epoch 7, batch 2190
training loss: 0.01928809843957424 

Epoch 7, batch 2191
training loss: 0.024002937600016594 

Epoch 7, batch 2192
training loss: 0.02643122337758541 

Epoch 7, batch 2193
training loss: 0.050176702439785004 

Epoch 7, batch 2194
training loss: 0.022277671843767166 

Epoch 7, batch 2195
training loss: 0.009490139782428741 

Epoch 7, batch 2196
training loss: 0.2900807857513428 

Epoch 7, batch 2197
training loss: 0.013216285035014153 

Epoch 7, batch 2198
training loss: 0.13667935132980347 

Epoch 7, batch 2199
training loss: 0.35259824991226196 

Epoch 7, batch 2200
training loss: 0.020744971930980682 

Epoch 7, batch 2201
training loss: 0.024063831195235252 

Epoch 7, batch 2202
training loss: 0.019011739641427994 

Epoch 7, batch 2203
training loss: 0.021796923130750656 

Epoch 7, batch 2204
training loss: 0.19606931507587433 

Epoch 7, batch 2205
training loss: 0.08751153945922852 

Epoch 7, batch 2206
tra

Epoch 7, batch 2409
training loss: 0.08454987406730652 

Epoch 7, batch 2410
training loss: 0.6415899991989136 

Epoch 7, batch 2411
training loss: 0.0031195199117064476 

Epoch 7, batch 2412
training loss: 0.04611470177769661 

Epoch 7, batch 2413
training loss: 0.14243856072425842 

Epoch 7, batch 2414
training loss: 0.14293572306632996 

Epoch 7, batch 2415
training loss: 0.5651780962944031 

Epoch 7, batch 2416
training loss: 0.6197251677513123 

Epoch 7, batch 2417
training loss: 0.016381625086069107 

Epoch 7, batch 2418
training loss: 0.0555030032992363 

Epoch 7, batch 2419
training loss: 0.08763166517019272 

Epoch 7, batch 2420
training loss: 0.017498750239610672 

Epoch 7, batch 2421
training loss: 0.2637854218482971 

Epoch 7, batch 2422
training loss: 0.18565301597118378 

Epoch 7, batch 2423
training loss: 0.16108766198158264 

Epoch 7, batch 2424
training loss: 0.019462328404188156 

Epoch 7, batch 2425
training loss: 0.24818961322307587 

Epoch 7, batch 2426
training lo

Epoch 7, batch 2630
training loss: 0.20830723643302917 

Epoch 7, batch 2631
training loss: 0.1356406956911087 

Epoch 7, batch 2632
training loss: 0.005760472267866135 

Epoch 7, batch 2633
training loss: 0.14528818428516388 

Epoch 7, batch 2634
training loss: 0.04413224011659622 

Epoch 7, batch 2635
training loss: 0.16462194919586182 

Epoch 7, batch 2636
training loss: 0.3669494092464447 

Epoch 7, batch 2637
training loss: 0.004818706773221493 

Epoch 7, batch 2638
training loss: 0.05593735724687576 

Epoch 7, batch 2639
training loss: 0.40019625425338745 

Epoch 7, batch 2640
training loss: 0.009620620869100094 

Epoch 7, batch 2641
training loss: 0.026954103261232376 

Epoch 7, batch 2642
training loss: 0.0252997986972332 

Epoch 7, batch 2643
training loss: 0.498340904712677 

Epoch 7, batch 2644
training loss: 0.138202965259552 

Epoch 7, batch 2645
training loss: 0.012499636970460415 

Epoch 7, batch 2646
training loss: 0.41873660683631897 

Epoch 7, batch 2647
training loss

Epoch 7, batch 2848
training loss: 0.011174452491104603 

Epoch 7, batch 2849
training loss: 0.2517331838607788 

Epoch 7, batch 2850
training loss: 0.015827596187591553 

Epoch 7, batch 2851
training loss: 0.15158379077911377 

Epoch 7, batch 2852
training loss: 0.012633050791919231 

Epoch 7, batch 2853
training loss: 0.13684701919555664 

Epoch 7, batch 2854
training loss: 1.0873119831085205 

Epoch 7, batch 2855
training loss: 0.047400783747434616 

Epoch 7, batch 2856
training loss: 0.21488742530345917 

Epoch 7, batch 2857
training loss: 0.015542307868599892 

Epoch 7, batch 2858
training loss: 0.09012175351381302 

Epoch 7, batch 2859
training loss: 0.1387888491153717 

Epoch 7, batch 2860
training loss: 0.018838733434677124 

Epoch 7, batch 2861
training loss: 0.3695605397224426 

Epoch 7, batch 2862
training loss: 0.036777883768081665 

Epoch 7, batch 2863
training loss: 0.03210019692778587 

Epoch 7, batch 2864
training loss: 0.07810517400503159 

Epoch 7, batch 2865
training

Epoch 7, batch 3070
training loss: 0.06937562674283981 

Epoch 7, batch 3071
training loss: 0.06071088835597038 

Epoch 7, batch 3072
training loss: 0.1664549708366394 

Epoch 7, batch 3073
training loss: 0.20490522682666779 

Epoch 7, batch 3074
training loss: 0.0077813356183469296 

Epoch 7, batch 3075
training loss: 0.23418135941028595 

Epoch 7, batch 3076
training loss: 0.03781537339091301 

Epoch 7, batch 3077
training loss: 0.20528843998908997 

Epoch 7, batch 3078
training loss: 0.012006806209683418 

Epoch 7, batch 3079
training loss: 0.06087244302034378 

Epoch 7, batch 3080
training loss: 0.03243769705295563 

Epoch 7, batch 3081
training loss: 0.012021936476230621 

Epoch 7, batch 3082
training loss: 0.014467032626271248 

Epoch 7, batch 3083
training loss: 0.04004455357789993 

Epoch 7, batch 3084
training loss: 0.07541118562221527 

Epoch 7, batch 3085
training loss: 0.32088977098464966 

Epoch 7, batch 3086
training loss: 0.11217398941516876 

Epoch 7, batch 3087
trainin

Epoch 7, batch 3289
training loss: 0.03764490783214569 

Epoch 7, batch 3290
training loss: 0.06294357776641846 

Epoch 7, batch 3291
training loss: 0.4361124634742737 

Epoch 7, batch 3292
training loss: 0.013650299981236458 

Epoch 7, batch 3293
training loss: 0.01561148650944233 

Epoch 7, batch 3294
training loss: 0.02453310415148735 

Epoch 7, batch 3295
training loss: 0.005932207219302654 

Epoch 7, batch 3296
training loss: 0.013869652524590492 

Epoch 7, batch 3297
training loss: 0.8085017204284668 

Epoch 7, batch 3298
training loss: 0.0460457019507885 

Epoch 7, batch 3299
training loss: 0.03293222188949585 

Epoch 7, batch 3300
training loss: 0.24683837592601776 

Epoch 7, batch 3301
training loss: 0.04330567643046379 

Epoch 7, batch 3302
training loss: 0.019897671416401863 

Epoch 7, batch 3303
training loss: 0.03317118436098099 

Epoch 7, batch 3304
training loss: 0.039985861629247665 

Epoch 7, batch 3305
training loss: 0.08170844614505768 

Epoch 7, batch 3306
training 

Epoch 7, batch 3509
training loss: 0.11043767631053925 

Epoch 7, batch 3510
training loss: 0.006282339803874493 

Epoch 7, batch 3511
training loss: 0.08154558390378952 

Epoch 7, batch 3512
training loss: 0.10373149812221527 

Epoch 7, batch 3513
training loss: 0.12445958703756332 

Epoch 7, batch 3514
training loss: 0.10991134494543076 

Epoch 7, batch 3515
training loss: 0.0454614982008934 

Epoch 7, batch 3516
training loss: 0.37622418999671936 

Epoch 7, batch 3517
training loss: 0.432972252368927 

Epoch 7, batch 3518
training loss: 0.1343897581100464 

Epoch 7, batch 3519
training loss: 0.13355307281017303 

Epoch 7, batch 3520
training loss: 0.04252356290817261 

Epoch 7, batch 3521
training loss: 0.06442465633153915 

Epoch 7, batch 3522
training loss: 0.08287524431943893 

Epoch 7, batch 3523
training loss: 0.008586994372308254 

Epoch 7, batch 3524
training loss: 0.7128223776817322 

Epoch 7, batch 3525
training loss: 0.09372372180223465 

Epoch 7, batch 3526
training loss:

Epoch 7, batch 3727
training loss: 0.08532103151082993 

Epoch 7, batch 3728
training loss: 0.08879697322845459 

Epoch 7, batch 3729
training loss: 0.06319475919008255 

Epoch 7, batch 3730
training loss: 0.04770687222480774 

Epoch 7, batch 3731
training loss: 0.09377018362283707 

Epoch 7, batch 3732
training loss: 0.256809264421463 

Epoch 7, batch 3733
training loss: 0.30781808495521545 

Epoch 7, batch 3734
training loss: 0.049292124807834625 

Epoch 7, batch 3735
training loss: 0.2182089388370514 

Epoch 7, batch 3736
training loss: 0.036153167486190796 

Epoch 7, batch 3737
training loss: 0.060087449848651886 

Epoch 7, batch 3738
training loss: 0.07800132036209106 

Epoch 7, batch 3739
training loss: 0.0586308054625988 

Epoch 7, batch 3740
training loss: 0.2564602494239807 

Epoch 7, batch 3741
training loss: 0.0778137594461441 

Epoch 7, batch 3742
training loss: 0.028629112988710403 

Epoch 7, batch 3743
training loss: 0.089996337890625 

Epoch 7, batch 3744
training loss: 

Epoch 7, batch 3947
training loss: 0.9733594655990601 

Epoch 7, batch 3948
training loss: 0.012788744643330574 

Epoch 7, batch 3949
training loss: 0.02194271609187126 

Epoch 7, batch 3950
training loss: 0.014568226411938667 

Epoch 7, batch 3951
training loss: 0.07102986425161362 

Epoch 7, batch 3952
training loss: 0.014363701455295086 

Epoch 7, batch 3953
training loss: 0.02625102363526821 

Epoch 7, batch 3954
training loss: 0.02845287322998047 

Epoch 7, batch 3955
training loss: 0.01809476688504219 

Epoch 7, batch 3956
training loss: 0.36090466380119324 

Epoch 7, batch 3957
training loss: 0.030807077884674072 

Epoch 7, batch 3958
training loss: 0.04858741536736488 

Epoch 7, batch 3959
training loss: 0.019294338300824165 

Epoch 7, batch 3960
training loss: 0.017110323533415794 

Epoch 7, batch 3961
training loss: 0.06727739423513412 

Epoch 7, batch 3962
training loss: 0.17717817425727844 

Epoch 7, batch 3963
training loss: 0.03968008607625961 

Epoch 7, batch 3964
traini

Epoch 7, batch 4169
training loss: 0.15802261233329773 

Epoch 7, batch 4170
training loss: 0.02294340543448925 

Epoch 7, batch 4171
training loss: 0.12651535868644714 

Epoch 7, batch 4172
training loss: 0.013124572113156319 

Epoch 7, batch 4173
training loss: 0.4140886664390564 

Epoch 7, batch 4174
training loss: 0.14752915501594543 

Epoch 7, batch 4175
training loss: 0.018625345081090927 

Epoch 7, batch 4176
training loss: 0.023654701188206673 

Epoch 7, batch 4177
training loss: 0.1476183980703354 

Epoch 7, batch 4178
training loss: 0.006952798459678888 

Epoch 7, batch 4179
training loss: 0.055933959782123566 

Epoch 7, batch 4180
training loss: 0.023142069578170776 

Epoch 7, batch 4181
training loss: 0.05312230437994003 

Epoch 7, batch 4182
training loss: 0.40389490127563477 

Epoch 7, batch 4183
training loss: 0.004986257757991552 

Epoch 7, batch 4184
training loss: 0.10858973115682602 

Epoch 7, batch 4185
training loss: 0.36904358863830566 

Epoch 7, batch 4186
traini

Epoch 7, batch 4390
training loss: 0.007928220555186272 

Epoch 7, batch 4391
training loss: 0.16782455146312714 

Epoch 7, batch 4392
training loss: 0.16956782341003418 

Epoch 7, batch 4393
training loss: 0.08846956491470337 

Epoch 7, batch 4394
training loss: 0.012754037976264954 

Epoch 7, batch 4395
training loss: 0.014923940412700176 

Epoch 7, batch 4396
training loss: 0.8837310075759888 

Epoch 7, batch 4397
training loss: 0.40464115142822266 

Epoch 7, batch 4398
training loss: 0.18727359175682068 

Epoch 7, batch 4399
training loss: 0.08827318251132965 

Epoch 7, batch 4400
training loss: 0.06308327615261078 

Epoch 7, batch 4401
training loss: 0.015495561063289642 

Epoch 7, batch 4402
training loss: 0.021481039002537727 

Epoch 7, batch 4403
training loss: 0.011753800325095654 

Epoch 7, batch 4404
training loss: 0.4508306086063385 

Epoch 7, batch 4405
training loss: 0.012016532942652702 

Epoch 7, batch 4406
training loss: 0.017233045771718025 

Epoch 7, batch 4407
train

Epoch 7, batch 4605
training loss: 0.6461986303329468 

Epoch 7, batch 4606
training loss: 0.13081294298171997 

Epoch 7, batch 4607
training loss: 0.013954751193523407 

Epoch 7, batch 4608
training loss: 0.011407343670725822 

Epoch 7, batch 4609
training loss: 0.06050960347056389 

Epoch 7, batch 4610
training loss: 0.2410092055797577 

Epoch 7, batch 4611
training loss: 0.03635469824075699 

Epoch 7, batch 4612
training loss: 0.00839940831065178 

Epoch 7, batch 4613
training loss: 0.2521854043006897 

Epoch 7, batch 4614
training loss: 0.02225380577147007 

Epoch 7, batch 4615
training loss: 0.004217987414449453 

Epoch 7, batch 4616
training loss: 0.016262482851743698 

Epoch 7, batch 4617
training loss: 0.031410057097673416 

Epoch 7, batch 4618
training loss: 0.6626302003860474 

Epoch 7, batch 4619
training loss: 0.00532721308991313 

Epoch 7, batch 4620
training loss: 0.01652652397751808 

Epoch 7, batch 4621
training loss: 0.014466775581240654 

Epoch 7, batch 4622
training 

Epoch 7, batch 4826
training loss: 0.008178471587598324 

Epoch 7, batch 4827
training loss: 0.17224764823913574 

Epoch 7, batch 4828
training loss: 0.20050248503684998 

Epoch 7, batch 4829
training loss: 0.026810860261321068 

Epoch 7, batch 4830
training loss: 0.14858615398406982 

Epoch 7, batch 4831
training loss: 0.10103663057088852 

Epoch 7, batch 4832
training loss: 0.26425957679748535 

Epoch 7, batch 4833
training loss: 0.007927569560706615 

Epoch 7, batch 4834
training loss: 0.039230942726135254 

Epoch 7, batch 4835
training loss: 0.1084655374288559 

Epoch 7, batch 4836
training loss: 0.026652734726667404 

Epoch 7, batch 4837
training loss: 0.04237079247832298 

Epoch 7, batch 4838
training loss: 0.4232591986656189 

Epoch 7, batch 4839
training loss: 0.01174355112016201 

Epoch 7, batch 4840
training loss: 0.05950724333524704 

Epoch 7, batch 4841
training loss: 0.00826578214764595 

Epoch 7, batch 4842
training loss: 0.11955473572015762 

Epoch 7, batch 4843
training

Epoch 7, batch 5044
training loss: 0.019370948895812035 

Epoch 7, batch 5045
training loss: 0.6865392923355103 

Epoch 7, batch 5046
training loss: 0.053008150309324265 

Epoch 7, batch 5047
training loss: 0.013020726852118969 

Epoch 7, batch 5048
training loss: 0.08358027040958405 

Epoch 7, batch 5049
training loss: 0.1458888053894043 

Epoch 7, batch 5050
training loss: 0.0613647922873497 

Epoch 7, batch 5051
training loss: 0.12679901719093323 

Epoch 7, batch 5052
training loss: 0.4617999494075775 

Epoch 7, batch 5053
training loss: 0.006713539361953735 

Epoch 7, batch 5054
training loss: 0.03914885222911835 

Epoch 7, batch 5055
training loss: 0.009502379223704338 

Epoch 7, batch 5056
training loss: 0.02942778170108795 

Epoch 7, batch 5057
training loss: 0.15937864780426025 

Epoch 7, batch 5058
training loss: 0.0462418757379055 

Epoch 7, batch 5059
training loss: 0.24751970171928406 

Epoch 7, batch 5060
training loss: 1.1078120470046997 

Epoch 7, batch 5061
training los

Epoch 7, batch 5262
training loss: 0.3753132224082947 

Epoch 7, batch 5263
training loss: 0.31655165553092957 

Epoch 7, batch 5264
training loss: 0.28607696294784546 

Epoch 7, batch 5265
training loss: 0.1896434873342514 

Epoch 7, batch 5266
training loss: 0.026136552914977074 

Epoch 7, batch 5267
training loss: 0.03631233423948288 

Epoch 7, batch 5268
training loss: 0.0624132938683033 

Epoch 7, batch 5269
training loss: 0.07992490381002426 

Epoch 7, batch 5270
training loss: 0.048215869814157486 

Epoch 7, batch 5271
training loss: 0.016347995027899742 

Epoch 7, batch 5272
training loss: 0.027166545391082764 

Epoch 7, batch 5273
training loss: 0.13542166352272034 

Epoch 7, batch 5274
training loss: 0.05658842250704765 

Epoch 7, batch 5275
training loss: 0.03683152049779892 

Epoch 7, batch 5276
training loss: 0.052637260407209396 

Epoch 7, batch 5277
training loss: 0.028143856674432755 

Epoch 7, batch 5278
training loss: 0.05551198869943619 

Epoch 7, batch 5279
training

Epoch 7, batch 5485
training loss: 0.013336924836039543 

Epoch 7, batch 5486
training loss: 0.15135103464126587 

Epoch 7, batch 5487
training loss: 0.006805178709328175 

Epoch 7, batch 5488
training loss: 0.006917194928973913 

Epoch 7, batch 5489
training loss: 0.09386129677295685 

Epoch 7, batch 5490
training loss: 0.0020568366162478924 

Epoch 7, batch 5491
training loss: 0.09685058146715164 

Epoch 7, batch 5492
training loss: 0.02524365857243538 

Epoch 7, batch 5493
training loss: 0.042635537683963776 

Epoch 7, batch 5494
training loss: 0.2719293236732483 

Epoch 7, batch 5495
training loss: 0.07059259712696075 

Epoch 7, batch 5496
training loss: 0.0747327208518982 

Epoch 7, batch 5497
training loss: 0.06269760429859161 

Epoch 7, batch 5498
training loss: 0.01470959186553955 

Epoch 7, batch 5499
training loss: 0.21344205737113953 

Epoch 7, batch 5500
training loss: 0.07435518503189087 

Epoch 7, batch 5501
training loss: 0.2640976905822754 

Epoch 7, batch 5502
training

Epoch 7, batch 5706
training loss: 0.04094286262989044 

Epoch 7, batch 5707
training loss: 0.31206613779067993 

Epoch 7, batch 5708
training loss: 0.013435003347694874 

Epoch 7, batch 5709
training loss: 0.0949915200471878 

Epoch 7, batch 5710
training loss: 0.35729318857192993 

Epoch 7, batch 5711
training loss: 0.02021852508187294 

Epoch 7, batch 5712
training loss: 0.37319615483283997 

Epoch 7, batch 5713
training loss: 0.02910013496875763 

Epoch 7, batch 5714
training loss: 0.09024044126272202 

Epoch 7, batch 5715
training loss: 0.07066916674375534 

Epoch 7, batch 5716
training loss: 0.8041553497314453 

Epoch 7, batch 5717
training loss: 0.090036541223526 

Epoch 7, batch 5718
training loss: 0.04439458250999451 

Epoch 7, batch 5719
training loss: 0.02976399101316929 

Epoch 7, batch 5720
training loss: 0.3049164414405823 

Epoch 7, batch 5721
training loss: 0.007396265864372253 

Epoch 7, batch 5722
training loss: 0.022951778024435043 

Epoch 7, batch 5723
training loss

Epoch 7, batch 5930
training loss: 0.005868437234312296 

Epoch 7, batch 5931
training loss: 0.06486458331346512 

Epoch 7, batch 5932
training loss: 0.18420688807964325 

Epoch 7, batch 5933
training loss: 0.12487737089395523 

Epoch 7, batch 5934
training loss: 0.016080733388662338 

Epoch 7, batch 5935
training loss: 0.3708176612854004 

Epoch 7, batch 5936
training loss: 0.2652234137058258 

Epoch 7, batch 5937
training loss: 0.14909979701042175 

Epoch 7, batch 5938
training loss: 0.017767833545804024 

Epoch 7, batch 5939
training loss: 0.030617546290159225 

Epoch 7, batch 5940
training loss: 0.04872281104326248 

Epoch 7, batch 5941
training loss: 0.10936033725738525 

Epoch 7, batch 5942
training loss: 0.20457077026367188 

Epoch 7, batch 5943
training loss: 0.032132722437381744 

Epoch 7, batch 5944
training loss: 0.055015064775943756 

Epoch 7, batch 5945
training loss: 0.018869828432798386 

Epoch 7, batch 5946
training loss: 0.030897116288542747 

Epoch 7, batch 5947
train

Epoch 8, batch 148
training loss: 0.038176555186510086 

Epoch 8, batch 149
training loss: 0.011180071160197258 

Epoch 8, batch 150
training loss: 0.007408274803310633 

Epoch 8, batch 151
training loss: 0.3054130971431732 

Epoch 8, batch 152
training loss: 0.08475078642368317 

Epoch 8, batch 153
training loss: 0.08464878797531128 

Epoch 8, batch 154
training loss: 0.03760115057229996 

Epoch 8, batch 155
training loss: 0.003136744722723961 

Epoch 8, batch 156
training loss: 0.541054368019104 

Epoch 8, batch 157
training loss: 0.07731984555721283 

Epoch 8, batch 158
training loss: 0.10537244379520416 

Epoch 8, batch 159
training loss: 0.09345061331987381 

Epoch 8, batch 160
training loss: 0.019274555146694183 

Epoch 8, batch 161
training loss: 0.2156129777431488 

Epoch 8, batch 162
training loss: 0.03590188920497894 

Epoch 8, batch 163
training loss: 0.4373820722103119 

Epoch 8, batch 164
training loss: 1.0806158781051636 

Epoch 8, batch 165
training loss: 0.0128957135602

Epoch 8, batch 371
training loss: 0.10618311166763306 

Epoch 8, batch 372
training loss: 0.007643203251063824 

Epoch 8, batch 373
training loss: 0.004303078167140484 

Epoch 8, batch 374
training loss: 0.05410321429371834 

Epoch 8, batch 375
training loss: 0.13156960904598236 

Epoch 8, batch 376
training loss: 0.06585393100976944 

Epoch 8, batch 377
training loss: 0.008597508072853088 

Epoch 8, batch 378
training loss: 0.16976261138916016 

Epoch 8, batch 379
training loss: 0.12231378257274628 

Epoch 8, batch 380
training loss: 0.03970836475491524 

Epoch 8, batch 381
training loss: 0.022844482213258743 

Epoch 8, batch 382
training loss: 0.06667301058769226 

Epoch 8, batch 383
training loss: 0.01855304278433323 

Epoch 8, batch 384
training loss: 0.004362717270851135 

Epoch 8, batch 385
training loss: 0.06712466478347778 

Epoch 8, batch 386
training loss: 0.14708258211612701 

Epoch 8, batch 387
training loss: 0.01142494659870863 

Epoch 8, batch 388
training loss: 0.0287146

Epoch 8, batch 593
training loss: 0.3934401571750641 

Epoch 8, batch 594
training loss: 0.10066956281661987 

Epoch 8, batch 595
training loss: 0.9771970510482788 

Epoch 8, batch 596
training loss: 0.08206849545240402 

Epoch 8, batch 597
training loss: 0.010602914728224277 

Epoch 8, batch 598
training loss: 0.032373156398534775 

Epoch 8, batch 599
training loss: 0.20046675205230713 

Epoch 8, batch 600
training loss: 0.004490247927606106 

Epoch 8, batch 601
training loss: 0.17003759741783142 

Epoch 8, batch 602
training loss: 0.21076688170433044 

Epoch 8, batch 603
training loss: 0.2377053052186966 

Epoch 8, batch 604
training loss: 0.04300231486558914 

Epoch 8, batch 605
training loss: 0.25088298320770264 

Epoch 8, batch 606
training loss: 0.001973093021661043 

Epoch 8, batch 607
training loss: 0.0020690388046205044 

Epoch 8, batch 608
training loss: 0.05990912392735481 

Epoch 8, batch 609
training loss: 0.03422131389379501 

Epoch 8, batch 610
training loss: 0.042217753

Epoch 8, batch 804
training loss: 0.050278790295124054 

Epoch 8, batch 805
training loss: 0.05905995890498161 

Epoch 8, batch 806
training loss: 0.09044843167066574 

Epoch 8, batch 807
training loss: 0.0403449572622776 

Epoch 8, batch 808
training loss: 0.2575821578502655 

Epoch 8, batch 809
training loss: 0.009758969768881798 

Epoch 8, batch 810
training loss: 0.6055395603179932 

Epoch 8, batch 811
training loss: 0.05099738761782646 

Epoch 8, batch 812
training loss: 0.08675290644168854 

Epoch 8, batch 813
training loss: 0.06634130328893661 

Epoch 8, batch 814
training loss: 0.0912044495344162 

Epoch 8, batch 815
training loss: 0.004626053385436535 

Epoch 8, batch 816
training loss: 0.01337224431335926 

Epoch 8, batch 817
training loss: 0.2474973201751709 

Epoch 8, batch 818
training loss: 0.05170701816678047 

Epoch 8, batch 819
training loss: 0.19811168313026428 

Epoch 8, batch 820
training loss: 0.0719137042760849 

Epoch 8, batch 821
training loss: 0.007236403878778

Epoch 8, batch 1023
training loss: 0.0882614329457283 

Epoch 8, batch 1024
training loss: 0.04569239169359207 

Epoch 8, batch 1025
training loss: 0.20705029368400574 

Epoch 8, batch 1026
training loss: 0.008536523208022118 

Epoch 8, batch 1027
training loss: 0.006505665369331837 

Epoch 8, batch 1028
training loss: 0.8055933713912964 

Epoch 8, batch 1029
training loss: 0.13026386499404907 

Epoch 8, batch 1030
training loss: 0.14560110867023468 

Epoch 8, batch 1031
training loss: 0.011257613077759743 

Epoch 8, batch 1032
training loss: 0.011519355699419975 

Epoch 8, batch 1033
training loss: 0.34489041566848755 

Epoch 8, batch 1034
training loss: 0.05383114889264107 

Epoch 8, batch 1035
training loss: 0.06039818003773689 

Epoch 8, batch 1036
training loss: 0.28459998965263367 

Epoch 8, batch 1037
training loss: 0.030960511416196823 

Epoch 8, batch 1038
training loss: 0.045608680695295334 

Epoch 8, batch 1039
training loss: 0.02878684177994728 

Epoch 8, batch 1040
trainin

Epoch 8, batch 1242
training loss: 0.12727180123329163 

Epoch 8, batch 1243
training loss: 0.12391563504934311 

Epoch 8, batch 1244
training loss: 0.08174730837345123 

Epoch 8, batch 1245
training loss: 0.03702555224299431 

Epoch 8, batch 1246
training loss: 0.0028974697925150394 

Epoch 8, batch 1247
training loss: 0.00729315634816885 

Epoch 8, batch 1248
training loss: 0.009965692646801472 

Epoch 8, batch 1249
training loss: 0.006222503259778023 

Epoch 8, batch 1250
training loss: 0.005006006918847561 

Epoch 8, batch 1251
training loss: 0.11247728019952774 

Epoch 8, batch 1252
training loss: 0.004396666307002306 

Epoch 8, batch 1253
training loss: 0.027847999706864357 

Epoch 8, batch 1254
training loss: 0.006799840368330479 

Epoch 8, batch 1255
training loss: 0.10002952814102173 

Epoch 8, batch 1256
training loss: 0.04274728521704674 

Epoch 8, batch 1257
training loss: 0.07480189204216003 

Epoch 8, batch 1258
training loss: 0.3181474804878235 

Epoch 8, batch 1259
trai

Epoch 8, batch 1462
training loss: 0.4139278531074524 

Epoch 8, batch 1463
training loss: 0.018798010423779488 

Epoch 8, batch 1464
training loss: 0.017959650605916977 

Epoch 8, batch 1465
training loss: 0.03273167833685875 

Epoch 8, batch 1466
training loss: 0.011844327673316002 

Epoch 8, batch 1467
training loss: 0.03654121235013008 

Epoch 8, batch 1468
training loss: 0.12528222799301147 

Epoch 8, batch 1469
training loss: 0.012519510462880135 

Epoch 8, batch 1470
training loss: 0.17671792209148407 

Epoch 8, batch 1471
training loss: 0.05426584556698799 

Epoch 8, batch 1472
training loss: 0.009990090504288673 

Epoch 8, batch 1473
training loss: 0.1817101538181305 

Epoch 8, batch 1474
training loss: 0.07505641877651215 

Epoch 8, batch 1475
training loss: 0.03290444612503052 

Epoch 8, batch 1476
training loss: 0.13171519339084625 

Epoch 8, batch 1477
training loss: 0.054408542811870575 

Epoch 8, batch 1478
training loss: 0.014738010242581367 

Epoch 8, batch 1479
traini

Epoch 8, batch 1674
training loss: 0.19742359220981598 

Epoch 8, batch 1675
training loss: 0.2216707170009613 

Epoch 8, batch 1676
training loss: 0.13711896538734436 

Epoch 8, batch 1677
training loss: 0.14435221254825592 

Epoch 8, batch 1678
training loss: 0.018360231071710587 

Epoch 8, batch 1679
training loss: 0.13488373160362244 

Epoch 8, batch 1680
training loss: 0.21015575528144836 

Epoch 8, batch 1681
training loss: 0.15262073278427124 

Epoch 8, batch 1682
training loss: 0.06362082809209824 

Epoch 8, batch 1683
training loss: 0.06393446773290634 

Epoch 8, batch 1684
training loss: 0.042320385575294495 

Epoch 8, batch 1685
training loss: 0.05115170031785965 

Epoch 8, batch 1686
training loss: 0.12135157734155655 

Epoch 8, batch 1687
training loss: 0.02019433118402958 

Epoch 8, batch 1688
training loss: 0.1790388971567154 

Epoch 8, batch 1689
training loss: 0.17135022580623627 

Epoch 8, batch 1690
training loss: 0.014833812601864338 

Epoch 8, batch 1691
training l

Epoch 8, batch 1896
training loss: 0.34777769446372986 

Epoch 8, batch 1897
training loss: 0.41073498129844666 

Epoch 8, batch 1898
training loss: 0.029502669349312782 

Epoch 8, batch 1899
training loss: 0.008812771178781986 

Epoch 8, batch 1900
training loss: 0.03875906392931938 

Epoch 8, batch 1901
training loss: 0.15194770693778992 

Epoch 8, batch 1902
training loss: 0.44750547409057617 

Epoch 8, batch 1903
training loss: 0.026882534846663475 

Epoch 8, batch 1904
training loss: 0.008801477029919624 

Epoch 8, batch 1905
training loss: 0.19742146134376526 

Epoch 8, batch 1906
training loss: 0.007212822791188955 

Epoch 8, batch 1907
training loss: 0.24842636287212372 

Epoch 8, batch 1908
training loss: 0.018192825838923454 

Epoch 8, batch 1909
training loss: 0.04830777645111084 

Epoch 8, batch 1910
training loss: 0.01717802882194519 

Epoch 8, batch 1911
training loss: 0.025290891528129578 

Epoch 8, batch 1912
training loss: 0.009686261415481567 

Epoch 8, batch 1913
tra

Epoch 8, batch 2116
training loss: 0.12670409679412842 

Epoch 8, batch 2117
training loss: 0.38746416568756104 

Epoch 8, batch 2118
training loss: 0.05131174996495247 

Epoch 8, batch 2119
training loss: 0.0074865445494651794 

Epoch 8, batch 2120
training loss: 0.09507676213979721 

Epoch 8, batch 2121
training loss: 0.3536064028739929 

Epoch 8, batch 2122
training loss: 0.13958227634429932 

Epoch 8, batch 2123
training loss: 0.8416560888290405 

Epoch 8, batch 2124
training loss: 0.026066362857818604 

Epoch 8, batch 2125
training loss: 0.13778308033943176 

Epoch 8, batch 2126
training loss: 0.3978036046028137 

Epoch 8, batch 2127
training loss: 0.034997060894966125 

Epoch 8, batch 2128
training loss: 0.24491000175476074 

Epoch 8, batch 2129
training loss: 0.29067447781562805 

Epoch 8, batch 2130
training loss: 0.1468832790851593 

Epoch 8, batch 2131
training loss: 0.02956397831439972 

Epoch 8, batch 2132
training loss: 0.0032099683303385973 

Epoch 8, batch 2133
training 

Epoch 8, batch 2338
training loss: 0.034490324556827545 

Epoch 8, batch 2339
training loss: 0.20030243694782257 

Epoch 8, batch 2340
training loss: 0.01602247543632984 

Epoch 8, batch 2341
training loss: 0.03367730230093002 

Epoch 8, batch 2342
training loss: 0.5102272033691406 

Epoch 8, batch 2343
training loss: 0.1864178627729416 

Epoch 8, batch 2344
training loss: 0.012577695772051811 

Epoch 8, batch 2345
training loss: 0.1859535574913025 

Epoch 8, batch 2346
training loss: 0.05067354440689087 

Epoch 8, batch 2347
training loss: 0.030313562601804733 

Epoch 8, batch 2348
training loss: 0.08281713724136353 

Epoch 8, batch 2349
training loss: 0.029634807258844376 

Epoch 8, batch 2350
training loss: 0.025700364261865616 

Epoch 8, batch 2351
training loss: 0.1538034975528717 

Epoch 8, batch 2352
training loss: 0.41166695952415466 

Epoch 8, batch 2353
training loss: 0.04042990133166313 

Epoch 8, batch 2354
training loss: 0.013010603375732899 

Epoch 8, batch 2355
training 

Epoch 8, batch 2559
training loss: 0.0855875089764595 

Epoch 8, batch 2560
training loss: 0.013598212972283363 

Epoch 8, batch 2561
training loss: 0.1267479956150055 

Epoch 8, batch 2562
training loss: 0.2971092164516449 

Epoch 8, batch 2563
training loss: 0.030801821500062943 

Epoch 8, batch 2564
training loss: 0.049520693719387054 

Epoch 8, batch 2565
training loss: 0.019501542672514915 

Epoch 8, batch 2566
training loss: 0.014788773842155933 

Epoch 8, batch 2567
training loss: 0.23062734305858612 

Epoch 8, batch 2568
training loss: 0.006472565233707428 

Epoch 8, batch 2569
training loss: 0.011562874540686607 

Epoch 8, batch 2570
training loss: 0.02536913752555847 

Epoch 8, batch 2571
training loss: 0.038927361369132996 

Epoch 8, batch 2572
training loss: 0.1490664929151535 

Epoch 8, batch 2573
training loss: 0.48527249693870544 

Epoch 8, batch 2574
training loss: 0.032853204756975174 

Epoch 8, batch 2575
training loss: 0.06678420305252075 

Epoch 8, batch 2576
traini

Epoch 8, batch 2779
training loss: 0.007870075292885303 

Epoch 8, batch 2780
training loss: 0.06051493436098099 

Epoch 8, batch 2781
training loss: 0.15266388654708862 

Epoch 8, batch 2782
training loss: 0.05710761994123459 

Epoch 8, batch 2783
training loss: 0.014961043372750282 

Epoch 8, batch 2784
training loss: 0.10093913227319717 

Epoch 8, batch 2785
training loss: 0.03323153406381607 

Epoch 8, batch 2786
training loss: 0.429049551486969 

Epoch 8, batch 2787
training loss: 0.1511927992105484 

Epoch 8, batch 2788
training loss: 0.0998089462518692 

Epoch 8, batch 2789
training loss: 0.014108854345977306 

Epoch 8, batch 2790
training loss: 0.07529222220182419 

Epoch 8, batch 2791
training loss: 0.03734252601861954 

Epoch 8, batch 2792
training loss: 0.13842806220054626 

Epoch 8, batch 2793
training loss: 0.027700331062078476 

Epoch 8, batch 2794
training loss: 0.03919392451643944 

Epoch 8, batch 2795
training loss: 0.1575208306312561 

Epoch 8, batch 2796
training los

Epoch 8, batch 3000
training loss: 0.018162867054343224 

Epoch 8, batch 3001
training loss: 0.41507667303085327 

Epoch 8, batch 3002
training loss: 0.04742252826690674 

Epoch 8, batch 3003
training loss: 0.03231433033943176 

Epoch 8, batch 3004
training loss: 0.09866879880428314 

Epoch 8, batch 3005
training loss: 0.01893952116370201 

Epoch 8, batch 3006
training loss: 0.07446109503507614 

Epoch 8, batch 3007
training loss: 0.11673995107412338 

Epoch 8, batch 3008
training loss: 0.05117088556289673 

Epoch 8, batch 3009
training loss: 0.03503343462944031 

Epoch 8, batch 3010
training loss: 0.16525903344154358 

Epoch 8, batch 3011
training loss: 0.16890151798725128 

Epoch 8, batch 3012
training loss: 0.05000365525484085 

Epoch 8, batch 3013
training loss: 0.02277226559817791 

Epoch 8, batch 3014
training loss: 0.008840332739055157 

Epoch 8, batch 3015
training loss: 0.09152631461620331 

Epoch 8, batch 3016
training loss: 0.011553977616131306 

Epoch 8, batch 3017
training

Epoch 8, batch 3218
training loss: 0.24044053256511688 

Epoch 8, batch 3219
training loss: 0.03952321410179138 

Epoch 8, batch 3220
training loss: 0.05892179533839226 

Epoch 8, batch 3221
training loss: 0.3887781798839569 

Epoch 8, batch 3222
training loss: 0.01431487686932087 

Epoch 8, batch 3223
training loss: 0.3594951033592224 

Epoch 8, batch 3224
training loss: 0.07309689372777939 

Epoch 8, batch 3225
training loss: 0.1004876047372818 

Epoch 8, batch 3226
training loss: 0.01622222736477852 

Epoch 8, batch 3227
training loss: 0.004996991250663996 

Epoch 8, batch 3228
training loss: 0.04043414443731308 

Epoch 8, batch 3229
training loss: 0.05632021278142929 

Epoch 8, batch 3230
training loss: 0.2178429812192917 

Epoch 8, batch 3231
training loss: 0.09122269600629807 

Epoch 8, batch 3232
training loss: 0.11204417794942856 

Epoch 8, batch 3233
training loss: 0.029162529855966568 

Epoch 8, batch 3234
training loss: 0.006765715777873993 

Epoch 8, batch 3235
training los

Epoch 8, batch 3439
training loss: 0.036161262542009354 

Epoch 8, batch 3440
training loss: 0.018314993008971214 

Epoch 8, batch 3441
training loss: 0.14131572842597961 

Epoch 8, batch 3442
training loss: 0.04378516972064972 

Epoch 8, batch 3443
training loss: 0.13216865062713623 

Epoch 8, batch 3444
training loss: 0.07863441854715347 

Epoch 8, batch 3445
training loss: 0.1488555520772934 

Epoch 8, batch 3446
training loss: 0.12694256007671356 

Epoch 8, batch 3447
training loss: 0.0068403990007936954 

Epoch 8, batch 3448
training loss: 0.07568858563899994 

Epoch 8, batch 3449
training loss: 0.0063065700232982635 

Epoch 8, batch 3450
training loss: 0.13260839879512787 

Epoch 8, batch 3451
training loss: 0.0143668781965971 

Epoch 8, batch 3452
training loss: 0.3357557952404022 

Epoch 8, batch 3453
training loss: 0.09603573381900787 

Epoch 8, batch 3454
training loss: 0.021332425996661186 

Epoch 8, batch 3455
training loss: 0.5394195318222046 

Epoch 8, batch 3456
training

Epoch 8, batch 3660
training loss: 0.04836782068014145 

Epoch 8, batch 3661
training loss: 0.015050245448946953 

Epoch 8, batch 3662
training loss: 0.014953291043639183 

Epoch 8, batch 3663
training loss: 0.04736632853746414 

Epoch 8, batch 3664
training loss: 0.003330348525196314 

Epoch 8, batch 3665
training loss: 0.6501497030258179 

Epoch 8, batch 3666
training loss: 0.05960816144943237 

Epoch 8, batch 3667
training loss: 0.1189897283911705 

Epoch 8, batch 3668
training loss: 0.05243254825472832 

Epoch 8, batch 3669
training loss: 0.03795917332172394 

Epoch 8, batch 3670
training loss: 0.15279468894004822 

Epoch 8, batch 3671
training loss: 0.5465058088302612 

Epoch 8, batch 3672
training loss: 0.4401708245277405 

Epoch 8, batch 3673
training loss: 0.023398585617542267 

Epoch 8, batch 3674
training loss: 0.029864948242902756 

Epoch 8, batch 3675
training loss: 0.3281829059123993 

Epoch 8, batch 3676
training loss: 1.0025337934494019 

Epoch 8, batch 3677
training los

Epoch 8, batch 3880
training loss: 0.23675787448883057 

Epoch 8, batch 3881
training loss: 0.16006603837013245 

Epoch 8, batch 3882
training loss: 0.00948883406817913 

Epoch 8, batch 3883
training loss: 0.007162906229496002 

Epoch 8, batch 3884
training loss: 0.04577375575900078 

Epoch 8, batch 3885
training loss: 0.014964600093662739 

Epoch 8, batch 3886
training loss: 0.1587129533290863 

Epoch 8, batch 3887
training loss: 0.06476987153291702 

Epoch 8, batch 3888
training loss: 0.03091438114643097 

Epoch 8, batch 3889
training loss: 0.3071208596229553 

Epoch 8, batch 3890
training loss: 0.03525851294398308 

Epoch 8, batch 3891
training loss: 0.009151458740234375 

Epoch 8, batch 3892
training loss: 0.048305660486221313 

Epoch 8, batch 3893
training loss: 0.23793983459472656 

Epoch 8, batch 3894
training loss: 0.20682330429553986 

Epoch 8, batch 3895
training loss: 0.03802326321601868 

Epoch 8, batch 3896
training loss: 0.02943468652665615 

Epoch 8, batch 3897
training 

Epoch 8, batch 4102
training loss: 0.05358950421214104 

Epoch 8, batch 4103
training loss: 0.012940523214638233 

Epoch 8, batch 4104
training loss: 0.06516354531049728 

Epoch 8, batch 4105
training loss: 0.003762459382414818 

Epoch 8, batch 4106
training loss: 0.03226973116397858 

Epoch 8, batch 4107
training loss: 0.2656622529029846 

Epoch 8, batch 4108
training loss: 0.08550893515348434 

Epoch 8, batch 4109
training loss: 0.8168174028396606 

Epoch 8, batch 4110
training loss: 0.019160684198141098 

Epoch 8, batch 4111
training loss: 0.21087749302387238 

Epoch 8, batch 4112
training loss: 0.009578440338373184 

Epoch 8, batch 4113
training loss: 0.012358981184661388 

Epoch 8, batch 4114
training loss: 0.09399864077568054 

Epoch 8, batch 4115
training loss: 0.05478566884994507 

Epoch 8, batch 4116
training loss: 0.02101515606045723 

Epoch 8, batch 4117
training loss: 0.12937895953655243 

Epoch 8, batch 4118
training loss: 0.9974652528762817 

Epoch 8, batch 4119
training 

Epoch 8, batch 4324
training loss: 0.1632377952337265 

Epoch 8, batch 4325
training loss: 0.04300672560930252 

Epoch 8, batch 4326
training loss: 0.40208688378334045 

Epoch 8, batch 4327
training loss: 0.07566101849079132 

Epoch 8, batch 4328
training loss: 0.009805282577872276 

Epoch 8, batch 4329
training loss: 0.0923970490694046 

Epoch 8, batch 4330
training loss: 0.04930334538221359 

Epoch 8, batch 4331
training loss: 0.22444915771484375 

Epoch 8, batch 4332
training loss: 0.03301514312624931 

Epoch 8, batch 4333
training loss: 0.013862033374607563 

Epoch 8, batch 4334
training loss: 0.01767258532345295 

Epoch 8, batch 4335
training loss: 0.0028179255314171314 

Epoch 8, batch 4336
training loss: 0.020578578114509583 

Epoch 8, batch 4337
training loss: 0.27265188097953796 

Epoch 8, batch 4338
training loss: 0.031396105885505676 

Epoch 8, batch 4339
training loss: 0.04303668439388275 

Epoch 8, batch 4340
training loss: 0.16875059902668 

Epoch 8, batch 4341
training l

Epoch 8, batch 4546
training loss: 0.04956363886594772 

Epoch 8, batch 4547
training loss: 0.06740503013134003 

Epoch 8, batch 4548
training loss: 0.007409333251416683 

Epoch 8, batch 4549
training loss: 0.27615147829055786 

Epoch 8, batch 4550
training loss: 0.011511081829667091 

Epoch 8, batch 4551
training loss: 0.07203898578882217 

Epoch 8, batch 4552
training loss: 0.00819387100636959 

Epoch 8, batch 4553
training loss: 0.12669093906879425 

Epoch 8, batch 4554
training loss: 0.012599244713783264 

Epoch 8, batch 4555
training loss: 0.039928924292325974 

Epoch 8, batch 4556
training loss: 0.13154374063014984 

Epoch 8, batch 4557
training loss: 0.05951660871505737 

Epoch 8, batch 4558
training loss: 0.06169562786817551 

Epoch 8, batch 4559
training loss: 0.024064145982265472 

Epoch 8, batch 4560
training loss: 0.04359468072652817 

Epoch 8, batch 4561
training loss: 0.07193601876497269 

Epoch 8, batch 4562
training loss: 0.052978239953517914 

Epoch 8, batch 4563
train

Epoch 8, batch 4769
training loss: 0.3321344554424286 

Epoch 8, batch 4770
training loss: 0.08062048256397247 

Epoch 8, batch 4771
training loss: 0.01766723021864891 

Epoch 8, batch 4772
training loss: 0.3000350594520569 

Epoch 8, batch 4773
training loss: 0.10666362941265106 

Epoch 8, batch 4774
training loss: 0.020802848041057587 

Epoch 8, batch 4775
training loss: 0.07453136146068573 

Epoch 8, batch 4776
training loss: 0.050587259232997894 

Epoch 8, batch 4777
training loss: 0.07812817394733429 

Epoch 8, batch 4778
training loss: 0.056646931916475296 

Epoch 8, batch 4779
training loss: 0.01390692126005888 

Epoch 8, batch 4780
training loss: 0.3437972068786621 

Epoch 8, batch 4781
training loss: 0.03322792798280716 

Epoch 8, batch 4782
training loss: 0.08518502861261368 

Epoch 8, batch 4783
training loss: 0.1850300431251526 

Epoch 8, batch 4784
training loss: 0.009358907118439674 

Epoch 8, batch 4785
training loss: 0.011597555130720139 

Epoch 8, batch 4786
training l

Epoch 8, batch 4989
training loss: 0.0037110187113285065 

Epoch 8, batch 4990
training loss: 0.013217982836067677 

Epoch 8, batch 4991
training loss: 0.03771501034498215 

Epoch 8, batch 4992
training loss: 0.39407384395599365 

Epoch 8, batch 4993
training loss: 0.05524919554591179 

Epoch 8, batch 4994
training loss: 0.02478950098156929 

Epoch 8, batch 4995
training loss: 0.22907087206840515 

Epoch 8, batch 4996
training loss: 0.026708949357271194 

Epoch 8, batch 4997
training loss: 0.1397807002067566 

Epoch 8, batch 4998
training loss: 0.0254233218729496 

Epoch 8, batch 4999
training loss: 0.2222779542207718 

Epoch 8, batch 5000
training loss: 0.043563857674598694 

Epoch 8, batch 5001
training loss: 0.0071586137637495995 

Epoch 8, batch 5002
training loss: 0.3264469504356384 

Epoch 8, batch 5003
training loss: 0.025568369776010513 

Epoch 8, batch 5004
training loss: 0.023544343188405037 

Epoch 8, batch 5005
training loss: 0.12849880754947662 

Epoch 8, batch 5006
traini

Epoch 8, batch 5209
training loss: 0.10135164111852646 

Epoch 8, batch 5210
training loss: 0.058963485062122345 

Epoch 8, batch 5211
training loss: 0.0571383535861969 

Epoch 8, batch 5212
training loss: 0.057739369571208954 

Epoch 8, batch 5213
training loss: 0.06838695704936981 

Epoch 8, batch 5214
training loss: 0.22418078780174255 

Epoch 8, batch 5215
training loss: 0.022028768435120583 

Epoch 8, batch 5216
training loss: 0.1502668708562851 

Epoch 8, batch 5217
training loss: 0.050115734338760376 

Epoch 8, batch 5218
training loss: 0.7305803894996643 

Epoch 8, batch 5219
training loss: 0.1839287132024765 

Epoch 8, batch 5220
training loss: 0.018152663484215736 

Epoch 8, batch 5221
training loss: 0.13877977430820465 

Epoch 8, batch 5222
training loss: 0.25694072246551514 

Epoch 8, batch 5223
training loss: 0.048759523779153824 

Epoch 8, batch 5224
training loss: 0.007662855088710785 

Epoch 8, batch 5225
training loss: 0.27592235803604126 

Epoch 8, batch 5226
training

Epoch 8, batch 5429
training loss: 0.12032520771026611 

Epoch 8, batch 5430
training loss: 0.049994535744190216 

Epoch 8, batch 5431
training loss: 0.03763536363840103 

Epoch 8, batch 5432
training loss: 0.23357398808002472 

Epoch 8, batch 5433
training loss: 0.01810413971543312 

Epoch 8, batch 5434
training loss: 0.01196970697492361 

Epoch 8, batch 5435
training loss: 0.2506555914878845 

Epoch 8, batch 5436
training loss: 0.014038977213203907 

Epoch 8, batch 5437
training loss: 0.03682843595743179 

Epoch 8, batch 5438
training loss: 0.17439809441566467 

Epoch 8, batch 5439
training loss: 0.07804439961910248 

Epoch 8, batch 5440
training loss: 0.05332634970545769 

Epoch 8, batch 5441
training loss: 0.02599775418639183 

Epoch 8, batch 5442
training loss: 0.21829207241535187 

Epoch 8, batch 5443
training loss: 0.39383676648139954 

Epoch 8, batch 5444
training loss: 0.10466722398996353 

Epoch 8, batch 5445
training loss: 0.008627249859273434 

Epoch 8, batch 5446
training 

Epoch 8, batch 5649
training loss: 0.10111626237630844 

Epoch 8, batch 5650
training loss: 0.039147429168224335 

Epoch 8, batch 5651
training loss: 0.23899772763252258 

Epoch 8, batch 5652
training loss: 0.47862809896469116 

Epoch 8, batch 5653
training loss: 0.04713800922036171 

Epoch 8, batch 5654
training loss: 0.043183907866477966 

Epoch 8, batch 5655
training loss: 0.015387470833957195 

Epoch 8, batch 5656
training loss: 0.034585826098918915 

Epoch 8, batch 5657
training loss: 0.04339415580034256 

Epoch 8, batch 5658
training loss: 0.037593334913253784 

Epoch 8, batch 5659
training loss: 0.20383624732494354 

Epoch 8, batch 5660
training loss: 0.420214980840683 

Epoch 8, batch 5661
training loss: 0.6011620759963989 

Epoch 8, batch 5662
training loss: 0.02214437909424305 

Epoch 8, batch 5663
training loss: 0.03862155228853226 

Epoch 8, batch 5664
training loss: 0.07319135963916779 

Epoch 8, batch 5665
training loss: 0.12524709105491638 

Epoch 8, batch 5666
training 

Epoch 8, batch 5872
training loss: 0.027455171570181847 

Epoch 8, batch 5873
training loss: 0.0081894900649786 

Epoch 8, batch 5874
training loss: 0.11711291968822479 

Epoch 8, batch 5875
training loss: 0.3017996549606323 

Epoch 8, batch 5876
training loss: 0.28852054476737976 

Epoch 8, batch 5877
training loss: 0.226365327835083 

Epoch 8, batch 5878
training loss: 0.016736861318349838 

Epoch 8, batch 5879
training loss: 0.2382805049419403 

Epoch 8, batch 5880
training loss: 0.010178091004490852 

Epoch 8, batch 5881
training loss: 0.03824003413319588 

Epoch 8, batch 5882
training loss: 0.01262268703430891 

Epoch 8, batch 5883
training loss: 0.2548554539680481 

Epoch 8, batch 5884
training loss: 0.024376733228564262 

Epoch 8, batch 5885
training loss: 0.25834280252456665 

Epoch 8, batch 5886
training loss: 0.055959682911634445 

Epoch 8, batch 5887
training loss: 0.17230761051177979 

Epoch 8, batch 5888
training loss: 0.2800859808921814 

Epoch 8, batch 5889
training loss

Epoch 9, batch 93
training loss: 0.03596961498260498 

Epoch 9, batch 94
training loss: 0.08565213531255722 

Epoch 9, batch 95
training loss: 0.0014266377547755837 

Epoch 9, batch 96
training loss: 0.020685747265815735 

Epoch 9, batch 97
training loss: 0.03032129630446434 

Epoch 9, batch 98
training loss: 0.236078143119812 

Epoch 9, batch 99
training loss: 0.005411891732364893 

Epoch 9, batch 100
training loss: 0.013636678457260132 

Epoch 9, batch 101
training loss: 0.10670782625675201 

Epoch 9, batch 102
training loss: 0.16556914150714874 

Epoch 9, batch 103
training loss: 0.003239565761759877 

Epoch 9, batch 104
training loss: 0.894305408000946 

Epoch 9, batch 105
training loss: 0.39840877056121826 

Epoch 9, batch 106
training loss: 0.24779780209064484 

Epoch 9, batch 107
training loss: 0.1317693591117859 

Epoch 9, batch 108
training loss: 0.5083345174789429 

Epoch 9, batch 109
training loss: 1.2382731437683105 

Epoch 9, batch 110
training loss: 0.0901498943567276 

E

Epoch 9, batch 315
training loss: 0.1509696990251541 

Epoch 9, batch 316
training loss: 0.03135911747813225 

Epoch 9, batch 317
training loss: 0.001782184699550271 

Epoch 9, batch 318
training loss: 0.09369846433401108 

Epoch 9, batch 319
training loss: 0.011087178252637386 

Epoch 9, batch 320
training loss: 0.3500533401966095 

Epoch 9, batch 321
training loss: 0.019896667450666428 

Epoch 9, batch 322
training loss: 0.005146824289113283 

Epoch 9, batch 323
training loss: 0.1350550353527069 

Epoch 9, batch 324
training loss: 0.020937591791152954 

Epoch 9, batch 325
training loss: 0.07750336825847626 

Epoch 9, batch 326
training loss: 0.017654070630669594 

Epoch 9, batch 327
training loss: 0.21352753043174744 

Epoch 9, batch 328
training loss: 0.12464523315429688 

Epoch 9, batch 329
training loss: 0.01929086074233055 

Epoch 9, batch 330
training loss: 0.32134538888931274 

Epoch 9, batch 331
training loss: 0.11992515623569489 

Epoch 9, batch 332
training loss: 0.108209118

Epoch 9, batch 537
training loss: 0.0037328233011066914 

Epoch 9, batch 538
training loss: 0.03967936709523201 

Epoch 9, batch 539
training loss: 0.14482896029949188 

Epoch 9, batch 540
training loss: 0.0028940069023519754 

Epoch 9, batch 541
training loss: 0.00948838796466589 

Epoch 9, batch 542
training loss: 0.535910427570343 

Epoch 9, batch 543
training loss: 0.017511015757918358 

Epoch 9, batch 544
training loss: 0.029893886297941208 

Epoch 9, batch 545
training loss: 0.17527733743190765 

Epoch 9, batch 546
training loss: 0.35137611627578735 

Epoch 9, batch 547
training loss: 0.06340928375720978 

Epoch 9, batch 548
training loss: 0.38382962346076965 

Epoch 9, batch 549
training loss: 0.06803326308727264 

Epoch 9, batch 550
training loss: 0.06754057109355927 

Epoch 9, batch 551
training loss: 0.01023049745708704 

Epoch 9, batch 552
training loss: 0.038690872490406036 

Epoch 9, batch 553
training loss: 0.007096876390278339 

Epoch 9, batch 554
training loss: 0.213495

Epoch 9, batch 761
training loss: 0.03461834043264389 

Epoch 9, batch 762
training loss: 0.07516764104366302 

Epoch 9, batch 763
training loss: 0.33641430735588074 

Epoch 9, batch 764
training loss: 0.07865101844072342 

Epoch 9, batch 765
training loss: 0.0024832026101648808 

Epoch 9, batch 766
training loss: 0.27624452114105225 

Epoch 9, batch 767
training loss: 0.05581348389387131 

Epoch 9, batch 768
training loss: 0.016917461529374123 

Epoch 9, batch 769
training loss: 0.1516505777835846 

Epoch 9, batch 770
training loss: 0.3530721962451935 

Epoch 9, batch 771
training loss: 0.0034778923727571964 

Epoch 9, batch 772
training loss: 0.11166535317897797 

Epoch 9, batch 773
training loss: 0.2622644305229187 

Epoch 9, batch 774
training loss: 0.07520712912082672 

Epoch 9, batch 775
training loss: 0.09743283689022064 

Epoch 9, batch 776
training loss: 0.11376986652612686 

Epoch 9, batch 777
training loss: 0.22280292212963104 

Epoch 9, batch 778
training loss: 0.0455092899

Epoch 9, batch 983
training loss: 0.012981006875634193 

Epoch 9, batch 984
training loss: 0.03715364634990692 

Epoch 9, batch 985
training loss: 0.021704401820898056 

Epoch 9, batch 986
training loss: 0.13621601462364197 

Epoch 9, batch 987
training loss: 0.031172040849924088 

Epoch 9, batch 988
training loss: 0.07032613456249237 

Epoch 9, batch 989
training loss: 0.005737786181271076 

Epoch 9, batch 990
training loss: 0.04473968595266342 

Epoch 9, batch 991
training loss: 0.01071365550160408 

Epoch 9, batch 992
training loss: 0.21116895973682404 

Epoch 9, batch 993
training loss: 0.023400653153657913 

Epoch 9, batch 994
training loss: 0.05206950381398201 

Epoch 9, batch 995
training loss: 0.008570177480578423 

Epoch 9, batch 996
training loss: 0.26725631952285767 

Epoch 9, batch 997
training loss: 0.09740196168422699 

Epoch 9, batch 998
training loss: 0.12890875339508057 

Epoch 9, batch 999
training loss: 0.048097699880599976 

Epoch 9, batch 1000
training loss: 0.1857

Epoch 9, batch 1203
training loss: 0.018390346318483353 

Epoch 9, batch 1204
training loss: 0.05422412231564522 

Epoch 9, batch 1205
training loss: 0.021039269864559174 

Epoch 9, batch 1206
training loss: 0.03113236092031002 

Epoch 9, batch 1207
training loss: 0.040805384516716 

Epoch 9, batch 1208
training loss: 0.09181123971939087 

Epoch 9, batch 1209
training loss: 0.026144858449697495 

Epoch 9, batch 1210
training loss: 0.07242719829082489 

Epoch 9, batch 1211
training loss: 0.08798066526651382 

Epoch 9, batch 1212
training loss: 0.026304343715310097 

Epoch 9, batch 1213
training loss: 0.0706186592578888 

Epoch 9, batch 1214
training loss: 0.04127340763807297 

Epoch 9, batch 1215
training loss: 0.016110341995954514 

Epoch 9, batch 1216
training loss: 0.13047124445438385 

Epoch 9, batch 1217
training loss: 0.02309034951031208 

Epoch 9, batch 1218
training loss: 0.012363554909825325 

Epoch 9, batch 1219
training loss: 0.00866266991943121 

Epoch 9, batch 1220
training

Epoch 9, batch 1424
training loss: 0.24243895709514618 

Epoch 9, batch 1425
training loss: 0.04372166469693184 

Epoch 9, batch 1426
training loss: 0.017017964273691177 

Epoch 9, batch 1427
training loss: 0.02843652106821537 

Epoch 9, batch 1428
training loss: 0.06900043785572052 

Epoch 9, batch 1429
training loss: 0.11799158900976181 

Epoch 9, batch 1430
training loss: 0.2823796272277832 

Epoch 9, batch 1431
training loss: 0.017039882019162178 

Epoch 9, batch 1432
training loss: 0.2677772641181946 

Epoch 9, batch 1433
training loss: 0.014733185060322285 

Epoch 9, batch 1434
training loss: 0.049691930413246155 

Epoch 9, batch 1435
training loss: 0.0302877277135849 

Epoch 9, batch 1436
training loss: 0.45129090547561646 

Epoch 9, batch 1437
training loss: 0.013398626819252968 

Epoch 9, batch 1438
training loss: 0.017353029921650887 

Epoch 9, batch 1439
training loss: 0.12281008064746857 

Epoch 9, batch 1440
training loss: 0.08105982840061188 

Epoch 9, batch 1441
training

Epoch 9, batch 1645
training loss: 0.004333898890763521 

Epoch 9, batch 1646
training loss: 0.04425454139709473 

Epoch 9, batch 1647
training loss: 0.007008391432464123 

Epoch 9, batch 1648
training loss: 0.019581280648708344 

Epoch 9, batch 1649
training loss: 0.06258323043584824 

Epoch 9, batch 1650
training loss: 0.07146351039409637 

Epoch 9, batch 1651
training loss: 0.049129582941532135 

Epoch 9, batch 1652
training loss: 0.014848923310637474 

Epoch 9, batch 1653
training loss: 0.00993184745311737 

Epoch 9, batch 1654
training loss: 0.11693765968084335 

Epoch 9, batch 1655
training loss: 0.0264614038169384 

Epoch 9, batch 1656
training loss: 0.06989289075136185 

Epoch 9, batch 1657
training loss: 0.061832912266254425 

Epoch 9, batch 1658
training loss: 0.004837718792259693 

Epoch 9, batch 1659
training loss: 0.035549964755773544 

Epoch 9, batch 1660
training loss: 0.15274570882320404 

Epoch 9, batch 1661
training loss: 0.016741830855607986 

Epoch 9, batch 1662
tra

Epoch 9, batch 1854
training loss: 0.1559584140777588 

Epoch 9, batch 1855
training loss: 0.13844051957130432 

Epoch 9, batch 1856
training loss: 0.09281273186206818 

Epoch 9, batch 1857
training loss: 0.22329814732074738 

Epoch 9, batch 1858
training loss: 0.014971902593970299 

Epoch 9, batch 1859
training loss: 0.1374269425868988 

Epoch 9, batch 1860
training loss: 0.009459661319851875 

Epoch 9, batch 1861
training loss: 0.7815030813217163 

Epoch 9, batch 1862
training loss: 0.0575835220515728 

Epoch 9, batch 1863
training loss: 0.20337672531604767 

Epoch 9, batch 1864
training loss: 0.07386717200279236 

Epoch 9, batch 1865
training loss: 0.003790422808378935 

Epoch 9, batch 1866
training loss: 0.02601677179336548 

Epoch 9, batch 1867
training loss: 0.224201038479805 

Epoch 9, batch 1868
training loss: 0.10200954973697662 

Epoch 9, batch 1869
training loss: 0.11082295328378677 

Epoch 9, batch 1870
training loss: 0.0879954844713211 

Epoch 9, batch 1871
training loss: 

Epoch 9, batch 2072
training loss: 0.03883174806833267 

Epoch 9, batch 2073
training loss: 0.01717299595475197 

Epoch 9, batch 2074
training loss: 0.08020729571580887 

Epoch 9, batch 2075
training loss: 0.07750914245843887 

Epoch 9, batch 2076
training loss: 0.019910523667931557 

Epoch 9, batch 2077
training loss: 0.11749191582202911 

Epoch 9, batch 2078
training loss: 0.18158473074436188 

Epoch 9, batch 2079
training loss: 0.07735675573348999 

Epoch 9, batch 2080
training loss: 0.0372699573636055 

Epoch 9, batch 2081
training loss: 0.20337148010730743 

Epoch 9, batch 2082
training loss: 0.024094905704259872 

Epoch 9, batch 2083
training loss: 0.00845249556005001 

Epoch 9, batch 2084
training loss: 0.03093266487121582 

Epoch 9, batch 2085
training loss: 0.005598938558250666 

Epoch 9, batch 2086
training loss: 0.02195562794804573 

Epoch 9, batch 2087
training loss: 0.00884209480136633 

Epoch 9, batch 2088
training loss: 0.025853103026747704 

Epoch 9, batch 2089
training

Epoch 9, batch 2290
training loss: 0.08083804696798325 

Epoch 9, batch 2291
training loss: 0.019351545721292496 

Epoch 9, batch 2292
training loss: 0.2591804563999176 

Epoch 9, batch 2293
training loss: 0.11164163053035736 

Epoch 9, batch 2294
training loss: 0.32842421531677246 

Epoch 9, batch 2295
training loss: 0.004505158867686987 

Epoch 9, batch 2296
training loss: 0.04321304336190224 

Epoch 9, batch 2297
training loss: 0.5959271192550659 

Epoch 9, batch 2298
training loss: 0.03946183994412422 

Epoch 9, batch 2299
training loss: 0.03503432124853134 

Epoch 9, batch 2300
training loss: 0.18955539166927338 

Epoch 9, batch 2301
training loss: 0.0804695338010788 

Epoch 9, batch 2302
training loss: 0.04292214661836624 

Epoch 9, batch 2303
training loss: 0.016429845243692398 

Epoch 9, batch 2304
training loss: 0.0026587536558508873 

Epoch 9, batch 2305
training loss: 0.030050674453377724 

Epoch 9, batch 2306
training loss: 0.024212025105953217 

Epoch 9, batch 2307
trainin

Epoch 9, batch 2508
training loss: 0.2109331339597702 

Epoch 9, batch 2509
training loss: 0.27059561014175415 

Epoch 9, batch 2510
training loss: 0.06447572261095047 

Epoch 9, batch 2511
training loss: 0.018574604764580727 

Epoch 9, batch 2512
training loss: 0.01178799755871296 

Epoch 9, batch 2513
training loss: 0.2632427215576172 

Epoch 9, batch 2514
training loss: 0.09399603307247162 

Epoch 9, batch 2515
training loss: 0.044199589639902115 

Epoch 9, batch 2516
training loss: 0.6017822623252869 

Epoch 9, batch 2517
training loss: 0.07476233690977097 

Epoch 9, batch 2518
training loss: 0.25271645188331604 

Epoch 9, batch 2519
training loss: 0.10302100330591202 

Epoch 9, batch 2520
training loss: 0.02798839844763279 

Epoch 9, batch 2521
training loss: 0.037475258111953735 

Epoch 9, batch 2522
training loss: 0.1920967400074005 

Epoch 9, batch 2523
training loss: 0.4531119465827942 

Epoch 9, batch 2524
training loss: 0.25693750381469727 

Epoch 9, batch 2525
training loss

Epoch 9, batch 2728
training loss: 0.027427975088357925 

Epoch 9, batch 2729
training loss: 0.06859098374843597 

Epoch 9, batch 2730
training loss: 0.011379016563296318 

Epoch 9, batch 2731
training loss: 0.2483077496290207 

Epoch 9, batch 2732
training loss: 0.0370507687330246 

Epoch 9, batch 2733
training loss: 0.12556152045726776 

Epoch 9, batch 2734
training loss: 0.34529608488082886 

Epoch 9, batch 2735
training loss: 0.004083108622580767 

Epoch 9, batch 2736
training loss: 0.01738196238875389 

Epoch 9, batch 2737
training loss: 0.1821211725473404 

Epoch 9, batch 2738
training loss: 0.05367220193147659 

Epoch 9, batch 2739
training loss: 0.013624945655465126 

Epoch 9, batch 2740
training loss: 0.11592236906290054 

Epoch 9, batch 2741
training loss: 0.06609965860843658 

Epoch 9, batch 2742
training loss: 0.11364998668432236 

Epoch 9, batch 2743
training loss: 0.296221524477005 

Epoch 9, batch 2744
training loss: 0.0285917017608881 

Epoch 9, batch 2745
training loss

Epoch 9, batch 2947
training loss: 0.07459511607885361 

Epoch 9, batch 2948
training loss: 0.19964657723903656 

Epoch 9, batch 2949
training loss: 0.008922032080590725 

Epoch 9, batch 2950
training loss: 0.07171911001205444 

Epoch 9, batch 2951
training loss: 0.03320206329226494 

Epoch 9, batch 2952
training loss: 0.6623464822769165 

Epoch 9, batch 2953
training loss: 0.03156080096960068 

Epoch 9, batch 2954
training loss: 0.09048789739608765 

Epoch 9, batch 2955
training loss: 0.010109717957675457 

Epoch 9, batch 2956
training loss: 0.05068963021039963 

Epoch 9, batch 2957
training loss: 0.29373735189437866 

Epoch 9, batch 2958
training loss: 0.012356680817902088 

Epoch 9, batch 2959
training loss: 0.026176825165748596 

Epoch 9, batch 2960
training loss: 0.1534460484981537 

Epoch 9, batch 2961
training loss: 0.012194410897791386 

Epoch 9, batch 2962
training loss: 0.30337101221084595 

Epoch 9, batch 2963
training loss: 0.29715847969055176 

Epoch 9, batch 2964
training

Epoch 9, batch 3167
training loss: 0.0034784593153744936 

Epoch 9, batch 3168
training loss: 0.11888536065816879 

Epoch 9, batch 3169
training loss: 0.00965820997953415 

Epoch 9, batch 3170
training loss: 0.07192341983318329 

Epoch 9, batch 3171
training loss: 0.0011984666343778372 

Epoch 9, batch 3172
training loss: 0.13354068994522095 

Epoch 9, batch 3173
training loss: 0.09158734232187271 

Epoch 9, batch 3174
training loss: 0.403531938791275 

Epoch 9, batch 3175
training loss: 0.050816841423511505 

Epoch 9, batch 3176
training loss: 0.01037084124982357 

Epoch 9, batch 3177
training loss: 0.031279556453228 

Epoch 9, batch 3178
training loss: 0.10369555652141571 

Epoch 9, batch 3179
training loss: 0.6252495646476746 

Epoch 9, batch 3180
training loss: 0.048301197588443756 

Epoch 9, batch 3181
training loss: 0.19896256923675537 

Epoch 9, batch 3182
training loss: 0.16173365712165833 

Epoch 9, batch 3183
training loss: 0.2796178460121155 

Epoch 9, batch 3184
training lo

Epoch 9, batch 3384
training loss: 0.04182342067360878 

Epoch 9, batch 3385
training loss: 0.04943183809518814 

Epoch 9, batch 3386
training loss: 0.44704824686050415 

Epoch 9, batch 3387
training loss: 0.23894348740577698 

Epoch 9, batch 3388
training loss: 0.00643206387758255 

Epoch 9, batch 3389
training loss: 0.029008662328124046 

Epoch 9, batch 3390
training loss: 0.020891640335321426 

Epoch 9, batch 3391
training loss: 0.004644871223717928 

Epoch 9, batch 3392
training loss: 0.027742132544517517 

Epoch 9, batch 3393
training loss: 0.15564076602458954 

Epoch 9, batch 3394
training loss: 0.21700234711170197 

Epoch 9, batch 3395
training loss: 0.02201526239514351 

Epoch 9, batch 3396
training loss: 0.03691435977816582 

Epoch 9, batch 3397
training loss: 0.31132298707962036 

Epoch 9, batch 3398
training loss: 0.02007969096302986 

Epoch 9, batch 3399
training loss: 0.33413684368133545 

Epoch 9, batch 3400
training loss: 0.01607673428952694 

Epoch 9, batch 3401
trainin

Epoch 9, batch 3601
training loss: 0.013452591374516487 

Epoch 9, batch 3602
training loss: 0.4162237048149109 

Epoch 9, batch 3603
training loss: 0.4489527642726898 

Epoch 9, batch 3604
training loss: 0.013722133822739124 

Epoch 9, batch 3605
training loss: 0.03615548834204674 

Epoch 9, batch 3606
training loss: 0.007445149123668671 

Epoch 9, batch 3607
training loss: 0.42265087366104126 

Epoch 9, batch 3608
training loss: 0.01633310131728649 

Epoch 9, batch 3609
training loss: 0.4989350438117981 

Epoch 9, batch 3610
training loss: 0.27258411049842834 

Epoch 9, batch 3611
training loss: 0.12554974853992462 

Epoch 9, batch 3612
training loss: 0.17914526164531708 

Epoch 9, batch 3613
training loss: 0.01385069452226162 

Epoch 9, batch 3614
training loss: 0.01821320690214634 

Epoch 9, batch 3615
training loss: 0.627831757068634 

Epoch 9, batch 3616
training loss: 0.014054084196686745 

Epoch 9, batch 3617
training loss: 0.11745603382587433 

Epoch 9, batch 3618
training los

Epoch 9, batch 3818
training loss: 0.0826970785856247 

Epoch 9, batch 3819
training loss: 0.012331308797001839 

Epoch 9, batch 3820
training loss: 0.00960535742342472 

Epoch 9, batch 3821
training loss: 0.008041965775191784 

Epoch 9, batch 3822
training loss: 0.041520457714796066 

Epoch 9, batch 3823
training loss: 0.5213085412979126 

Epoch 9, batch 3824
training loss: 0.01025616005063057 

Epoch 9, batch 3825
training loss: 0.036277495324611664 

Epoch 9, batch 3826
training loss: 0.006590086966753006 

Epoch 9, batch 3827
training loss: 0.019760848954319954 

Epoch 9, batch 3828
training loss: 0.010763322934508324 

Epoch 9, batch 3829
training loss: 0.006311463657766581 

Epoch 9, batch 3830
training loss: 0.0240509994328022 

Epoch 9, batch 3831
training loss: 0.010925495997071266 

Epoch 9, batch 3832
training loss: 0.005769313313066959 

Epoch 9, batch 3833
training loss: 0.008747930638492107 

Epoch 9, batch 3834
training loss: 0.10505829006433487 

Epoch 9, batch 3835
tra

Epoch 9, batch 4034
training loss: 0.09896855801343918 

Epoch 9, batch 4035
training loss: 0.09998701512813568 

Epoch 9, batch 4036
training loss: 0.12160183489322662 

Epoch 9, batch 4037
training loss: 0.64234858751297 

Epoch 9, batch 4038
training loss: 0.084089495241642 

Epoch 9, batch 4039
training loss: 0.4165499806404114 

Epoch 9, batch 4040
training loss: 0.017935875803232193 

Epoch 9, batch 4041
training loss: 0.27461355924606323 

Epoch 9, batch 4042
training loss: 0.019689250737428665 

Epoch 9, batch 4043
training loss: 0.024324335157871246 

Epoch 9, batch 4044
training loss: 0.03307114914059639 

Epoch 9, batch 4045
training loss: 0.0029716775752604008 

Epoch 9, batch 4046
training loss: 0.019105635583400726 

Epoch 9, batch 4047
training loss: 0.1085527166724205 

Epoch 9, batch 4048
training loss: 0.027484014630317688 

Epoch 9, batch 4049
training loss: 0.07647193223237991 

Epoch 9, batch 4050
training loss: 0.02245006337761879 

Epoch 9, batch 4051
training lo

Epoch 9, batch 4253
training loss: 0.6568304300308228 

Epoch 9, batch 4254
training loss: 0.05423711612820625 

Epoch 9, batch 4255
training loss: 0.0483214296400547 

Epoch 9, batch 4256
training loss: 0.11949761211872101 

Epoch 9, batch 4257
training loss: 1.0275202989578247 

Epoch 9, batch 4258
training loss: 0.16212037205696106 

Epoch 9, batch 4259
training loss: 0.518001914024353 

Epoch 9, batch 4260
training loss: 0.13988062739372253 

Epoch 9, batch 4261
training loss: 0.9737012982368469 

Epoch 9, batch 4262
training loss: 0.10988502204418182 

Epoch 9, batch 4263
training loss: 0.37049347162246704 

Epoch 9, batch 4264
training loss: 0.07766066491603851 

Epoch 9, batch 4265
training loss: 0.19221119582653046 

Epoch 9, batch 4266
training loss: 0.19020366668701172 

Epoch 9, batch 4267
training loss: 0.04800565540790558 

Epoch 9, batch 4268
training loss: 0.08540545403957367 

Epoch 9, batch 4269
training loss: 0.008201980032026768 

Epoch 9, batch 4270
training loss: 0

Epoch 9, batch 4470
training loss: 0.003320736810564995 

Epoch 9, batch 4471
training loss: 0.249015212059021 

Epoch 9, batch 4472
training loss: 0.11387167125940323 

Epoch 9, batch 4473
training loss: 0.04159499704837799 

Epoch 9, batch 4474
training loss: 0.21550914645195007 

Epoch 9, batch 4475
training loss: 0.13461990654468536 

Epoch 9, batch 4476
training loss: 0.1514430046081543 

Epoch 9, batch 4477
training loss: 0.05732392147183418 

Epoch 9, batch 4478
training loss: 0.1966417133808136 

Epoch 9, batch 4479
training loss: 0.010297881439328194 

Epoch 9, batch 4480
training loss: 0.010913518257439137 

Epoch 9, batch 4481
training loss: 0.055676836520433426 

Epoch 9, batch 4482
training loss: 0.1556634157896042 

Epoch 9, batch 4483
training loss: 0.13968849182128906 

Epoch 9, batch 4484
training loss: 0.02334992215037346 

Epoch 9, batch 4485
training loss: 0.5062558650970459 

Epoch 9, batch 4486
training loss: 0.08490005880594254 

Epoch 9, batch 4487
training loss

Epoch 9, batch 4694
training loss: 0.025883737951517105 

Epoch 9, batch 4695
training loss: 0.012195797637104988 

Epoch 9, batch 4696
training loss: 0.0185785461217165 

Epoch 9, batch 4697
training loss: 0.02239479497075081 

Epoch 9, batch 4698
training loss: 0.005331492982804775 

Epoch 9, batch 4699
training loss: 0.006502112839370966 

Epoch 9, batch 4700
training loss: 0.023816430941224098 

Epoch 9, batch 4701
training loss: 0.058409370481967926 

Epoch 9, batch 4702
training loss: 0.08287979662418365 

Epoch 9, batch 4703
training loss: 0.007390419952571392 

Epoch 9, batch 4704
training loss: 0.005703511647880077 

Epoch 9, batch 4705
training loss: 0.025609463453292847 

Epoch 9, batch 4706
training loss: 0.2931194305419922 

Epoch 9, batch 4707
training loss: 0.03071792796254158 

Epoch 9, batch 4708
training loss: 0.0030499256681650877 

Epoch 9, batch 4709
training loss: 0.0898018330335617 

Epoch 9, batch 4710
training loss: 0.008770913816988468 

Epoch 9, batch 4711
tr

Epoch 9, batch 4917
training loss: 0.06991400569677353 

Epoch 9, batch 4918
training loss: 0.0475558266043663 

Epoch 9, batch 4919
training loss: 0.10765375196933746 

Epoch 9, batch 4920
training loss: 0.613925576210022 

Epoch 9, batch 4921
training loss: 0.08824644237756729 

Epoch 9, batch 4922
training loss: 0.021509597077965736 

Epoch 9, batch 4923
training loss: 0.05376727133989334 

Epoch 9, batch 4924
training loss: 0.010851352475583553 

Epoch 9, batch 4925
training loss: 0.00905726756900549 

Epoch 9, batch 4926
training loss: 0.012209727428853512 

Epoch 9, batch 4927
training loss: 0.005434788763523102 

Epoch 9, batch 4928
training loss: 0.03968504071235657 

Epoch 9, batch 4929
training loss: 0.20192506909370422 

Epoch 9, batch 4930
training loss: 0.35232681035995483 

Epoch 9, batch 4931
training loss: 0.0028420770540833473 

Epoch 9, batch 4932
training loss: 0.016185294836759567 

Epoch 9, batch 4933
training loss: 0.18346866965293884 

Epoch 9, batch 4934
trainin

Epoch 9, batch 5139
training loss: 0.1271342635154724 

Epoch 9, batch 5140
training loss: 0.01912710815668106 

Epoch 9, batch 5141
training loss: 0.030764663591980934 

Epoch 9, batch 5142
training loss: 0.3592328429222107 

Epoch 9, batch 5143
training loss: 0.11381296068429947 

Epoch 9, batch 5144
training loss: 0.04455292224884033 

Epoch 9, batch 5145
training loss: 0.010522978380322456 

Epoch 9, batch 5146
training loss: 0.23951339721679688 

Epoch 9, batch 5147
training loss: 0.039835281670093536 

Epoch 9, batch 5148
training loss: 0.03291584178805351 

Epoch 9, batch 5149
training loss: 0.07425598800182343 

Epoch 9, batch 5150
training loss: 0.0045426818542182446 

Epoch 9, batch 5151
training loss: 0.006043442990630865 

Epoch 9, batch 5152
training loss: 0.0192517451941967 

Epoch 9, batch 5153
training loss: 0.014548989944159985 

Epoch 9, batch 5154
training loss: 0.0363006629049778 

Epoch 9, batch 5155
training loss: 0.0852058082818985 

Epoch 9, batch 5156
training 

Epoch 9, batch 5364
training loss: 0.21013858914375305 

Epoch 9, batch 5365
training loss: 0.024523835629224777 

Epoch 9, batch 5366
training loss: 0.08326868712902069 

Epoch 9, batch 5367
training loss: 0.30443114042282104 

Epoch 9, batch 5368
training loss: 0.10163822025060654 

Epoch 9, batch 5369
training loss: 0.0877409428358078 

Epoch 9, batch 5370
training loss: 0.006266591604799032 

Epoch 9, batch 5371
training loss: 0.5655670762062073 

Epoch 9, batch 5372
training loss: 0.040583536028862 

Epoch 9, batch 5373
training loss: 0.013377347961068153 

Epoch 9, batch 5374
training loss: 0.03185509145259857 

Epoch 9, batch 5375
training loss: 0.14321359992027283 

Epoch 9, batch 5376
training loss: 0.023880673572421074 

Epoch 9, batch 5377
training loss: 0.015350093133747578 

Epoch 9, batch 5378
training loss: 0.0022213177289813757 

Epoch 9, batch 5379
training loss: 0.008097417652606964 

Epoch 9, batch 5380
training loss: 0.057238779962062836 

Epoch 9, batch 5381
traini

Epoch 9, batch 5585
training loss: 0.0063977790996432304 

Epoch 9, batch 5586
training loss: 0.04422269016504288 

Epoch 9, batch 5587
training loss: 0.020990079268813133 

Epoch 9, batch 5588
training loss: 0.012108661234378815 

Epoch 9, batch 5589
training loss: 0.12411801517009735 

Epoch 9, batch 5590
training loss: 0.16942057013511658 

Epoch 9, batch 5591
training loss: 0.1531042903661728 

Epoch 9, batch 5592
training loss: 0.1767542064189911 

Epoch 9, batch 5593
training loss: 0.0076728700660169125 

Epoch 9, batch 5594
training loss: 0.24032458662986755 

Epoch 9, batch 5595
training loss: 0.027795076370239258 

Epoch 9, batch 5596
training loss: 0.011324277147650719 

Epoch 9, batch 5597
training loss: 0.3371012210845947 

Epoch 9, batch 5598
training loss: 0.11663015931844711 

Epoch 9, batch 5599
training loss: 0.0050201741978526115 

Epoch 9, batch 5600
training loss: 0.006263683550059795 

Epoch 9, batch 5601
training loss: 0.009008039720356464 

Epoch 9, batch 5602
tr

Epoch 9, batch 5805
training loss: 0.0043819742277264595 

Epoch 9, batch 5806
training loss: 0.05713571235537529 

Epoch 9, batch 5807
training loss: 0.0822170302271843 

Epoch 9, batch 5808
training loss: 0.028979772701859474 

Epoch 9, batch 5809
training loss: 0.3459186851978302 

Epoch 9, batch 5810
training loss: 0.10354907810688019 

Epoch 9, batch 5811
training loss: 0.08108530938625336 

Epoch 9, batch 5812
training loss: 0.6583142876625061 

Epoch 9, batch 5813
training loss: 0.006353339646011591 

Epoch 9, batch 5814
training loss: 0.05317951366305351 

Epoch 9, batch 5815
training loss: 0.0586395338177681 

Epoch 9, batch 5816
training loss: 0.004563618451356888 

Epoch 9, batch 5817
training loss: 0.26820477843284607 

Epoch 9, batch 5818
training loss: 0.01873091235756874 

Epoch 9, batch 5819
training loss: 0.016934750601649284 

Epoch 9, batch 5820
training loss: 0.01734032668173313 

Epoch 9, batch 5821
training loss: 0.11730418354272842 

Epoch 9, batch 5822
training 

Epoch 10, batch 25
training loss: 0.09683248400688171 

Epoch 10, batch 26
training loss: 0.0075683691538870335 

Epoch 10, batch 27
training loss: 0.005168442148715258 

Epoch 10, batch 28
training loss: 0.00499035743996501 

Epoch 10, batch 29
training loss: 0.013469142839312553 

Epoch 10, batch 30
training loss: 0.005480892024934292 

Epoch 10, batch 31
training loss: 0.06332478672266006 

Epoch 10, batch 32
training loss: 0.7207471132278442 

Epoch 10, batch 33
training loss: 0.0039023063145577908 

Epoch 10, batch 34
training loss: 0.02716812491416931 

Epoch 10, batch 35
training loss: 0.04857829958200455 

Epoch 10, batch 36
training loss: 0.11693441867828369 

Epoch 10, batch 37
training loss: 0.012097449973225594 

Epoch 10, batch 38
training loss: 0.13449285924434662 

Epoch 10, batch 39
training loss: 0.01462898962199688 

Epoch 10, batch 40
training loss: 0.015409896150231361 

Epoch 10, batch 41
training loss: 0.09073973447084427 

Epoch 10, batch 42
training loss: 0.0494

Epoch 10, batch 237
training loss: 0.10491912066936493 

Epoch 10, batch 238
training loss: 0.010488814674317837 

Epoch 10, batch 239
training loss: 0.12868787348270416 

Epoch 10, batch 240
training loss: 0.0646333172917366 

Epoch 10, batch 241
training loss: 0.079627126455307 

Epoch 10, batch 242
training loss: 0.1900731921195984 

Epoch 10, batch 243
training loss: 0.06494248658418655 

Epoch 10, batch 244
training loss: 0.012873448431491852 

Epoch 10, batch 245
training loss: 0.5542586445808411 

Epoch 10, batch 246
training loss: 0.004723338410258293 

Epoch 10, batch 247
training loss: 0.02643462084233761 

Epoch 10, batch 248
training loss: 0.015227722004055977 

Epoch 10, batch 249
training loss: 0.07345521450042725 

Epoch 10, batch 250
training loss: 0.0033567429054528475 

Epoch 10, batch 251
training loss: 0.02427086792886257 

Epoch 10, batch 252
training loss: 0.013410809449851513 

Epoch 10, batch 253
training loss: 0.06303351372480392 

Epoch 10, batch 254
training 

Epoch 10, batch 458
training loss: 0.01762506365776062 

Epoch 10, batch 459
training loss: 0.04378899186849594 

Epoch 10, batch 460
training loss: 0.012410306371748447 

Epoch 10, batch 461
training loss: 0.03479095175862312 

Epoch 10, batch 462
training loss: 0.002128326566889882 

Epoch 10, batch 463
training loss: 0.02871515229344368 

Epoch 10, batch 464
training loss: 0.020004525780677795 

Epoch 10, batch 465
training loss: 0.14032629132270813 

Epoch 10, batch 466
training loss: 0.024350643157958984 

Epoch 10, batch 467
training loss: 0.10331344604492188 

Epoch 10, batch 468
training loss: 0.06245095655322075 

Epoch 10, batch 469
training loss: 0.08560200035572052 

Epoch 10, batch 470
training loss: 0.0443301722407341 

Epoch 10, batch 471
training loss: 0.052344225347042084 

Epoch 10, batch 472
training loss: 0.01320600789040327 

Epoch 10, batch 473
training loss: 0.03457081690430641 

Epoch 10, batch 474
training loss: 0.011280827224254608 

Epoch 10, batch 475
traini

Epoch 10, batch 678
training loss: 0.4627501368522644 

Epoch 10, batch 679
training loss: 0.047787826508283615 

Epoch 10, batch 680
training loss: 0.030771862715482712 

Epoch 10, batch 681
training loss: 0.08092556893825531 

Epoch 10, batch 682
training loss: 0.07813651859760284 

Epoch 10, batch 683
training loss: 0.05580607056617737 

Epoch 10, batch 684
training loss: 0.2462584525346756 

Epoch 10, batch 685
training loss: 0.04407908767461777 

Epoch 10, batch 686
training loss: 0.06670482456684113 

Epoch 10, batch 687
training loss: 0.06136130541563034 

Epoch 10, batch 688
training loss: 0.03433837741613388 

Epoch 10, batch 689
training loss: 0.09856213629245758 

Epoch 10, batch 690
training loss: 0.016223084181547165 

Epoch 10, batch 691
training loss: 0.052473943680524826 

Epoch 10, batch 692
training loss: 0.7451174855232239 

Epoch 10, batch 693
training loss: 0.09069906175136566 

Epoch 10, batch 694
training loss: 0.14254648983478546 

Epoch 10, batch 695
training l

Epoch 10, batch 897
training loss: 0.05448610708117485 

Epoch 10, batch 898
training loss: 0.026818236336112022 

Epoch 10, batch 899
training loss: 0.07131408154964447 

Epoch 10, batch 900
training loss: 0.050946492701768875 

Epoch 10, batch 901
training loss: 0.12328390777111053 

Epoch 10, batch 902
training loss: 0.057512134313583374 

Epoch 10, batch 903
training loss: 0.12049033492803574 

Epoch 10, batch 904
training loss: 0.0020731990225613117 

Epoch 10, batch 905
training loss: 0.057776130735874176 

Epoch 10, batch 906
training loss: 0.025764569640159607 

Epoch 10, batch 907
training loss: 0.10777361690998077 

Epoch 10, batch 908
training loss: 0.029191484674811363 

Epoch 10, batch 909
training loss: 0.0450785867869854 

Epoch 10, batch 910
training loss: 0.005140113178640604 

Epoch 10, batch 911
training loss: 0.006328210234642029 

Epoch 10, batch 912
training loss: 0.02580070123076439 

Epoch 10, batch 913
training loss: 0.010499110445380211 

Epoch 10, batch 914
t

Epoch 10, batch 1118
training loss: 0.04292856529355049 

Epoch 10, batch 1119
training loss: 0.3589296042919159 

Epoch 10, batch 1120
training loss: 0.02746480703353882 

Epoch 10, batch 1121
training loss: 0.21362993121147156 

Epoch 10, batch 1122
training loss: 0.07016628980636597 

Epoch 10, batch 1123
training loss: 0.034103989601135254 

Epoch 10, batch 1124
training loss: 0.014518819749355316 

Epoch 10, batch 1125
training loss: 0.035975486040115356 

Epoch 10, batch 1126
training loss: 0.07140527665615082 

Epoch 10, batch 1127
training loss: 0.06643606722354889 

Epoch 10, batch 1128
training loss: 0.005669800098985434 

Epoch 10, batch 1129
training loss: 0.0796993225812912 

Epoch 10, batch 1130
training loss: 0.0078814085572958 

Epoch 10, batch 1131
training loss: 0.007777959108352661 

Epoch 10, batch 1132
training loss: 0.005797137506306171 

Epoch 10, batch 1133
training loss: 0.042584192007780075 

Epoch 10, batch 1134
training loss: 0.002097783610224724 

Epoch 10,

Epoch 10, batch 1335
training loss: 0.0035343323834240437 

Epoch 10, batch 1336
training loss: 0.008083844557404518 

Epoch 10, batch 1337
training loss: 0.009462589398026466 

Epoch 10, batch 1338
training loss: 0.013155976310372353 

Epoch 10, batch 1339
training loss: 0.004331781528890133 

Epoch 10, batch 1340
training loss: 0.06234865263104439 

Epoch 10, batch 1341
training loss: 0.010172687470912933 

Epoch 10, batch 1342
training loss: 0.02211391180753708 

Epoch 10, batch 1343
training loss: 0.035490572452545166 

Epoch 10, batch 1344
training loss: 0.058569710701704025 

Epoch 10, batch 1345
training loss: 0.6037660837173462 

Epoch 10, batch 1346
training loss: 0.1942799985408783 

Epoch 10, batch 1347
training loss: 0.053621429949998856 

Epoch 10, batch 1348
training loss: 0.05357102304697037 

Epoch 10, batch 1349
training loss: 0.8720806837081909 

Epoch 10, batch 1350
training loss: 0.014777074567973614 

Epoch 10, batch 1351
training loss: 0.019207289442420006 

Epoch

Epoch 10, batch 1555
training loss: 0.015130753628909588 

Epoch 10, batch 1556
training loss: 0.1158180832862854 

Epoch 10, batch 1557
training loss: 0.10345838963985443 

Epoch 10, batch 1558
training loss: 0.010191528126597404 

Epoch 10, batch 1559
training loss: 0.11751381307840347 

Epoch 10, batch 1560
training loss: 0.024956904351711273 

Epoch 10, batch 1561
training loss: 0.10322876274585724 

Epoch 10, batch 1562
training loss: 0.03285405784845352 

Epoch 10, batch 1563
training loss: 0.026180382817983627 

Epoch 10, batch 1564
training loss: 0.003145680297166109 

Epoch 10, batch 1565
training loss: 0.012762775644659996 

Epoch 10, batch 1566
training loss: 0.029712051153182983 

Epoch 10, batch 1567
training loss: 0.4516494870185852 

Epoch 10, batch 1568
training loss: 0.01269774604588747 

Epoch 10, batch 1569
training loss: 0.02898133173584938 

Epoch 10, batch 1570
training loss: 0.20196446776390076 

Epoch 10, batch 1571
training loss: 0.012380997650325298 

Epoch 10

Epoch 10, batch 1766
training loss: 0.04470960423350334 

Epoch 10, batch 1767
training loss: 0.0030914905946701765 

Epoch 10, batch 1768
training loss: 0.29888415336608887 

Epoch 10, batch 1769
training loss: 0.004374098964035511 

Epoch 10, batch 1770
training loss: 0.03999187424778938 

Epoch 10, batch 1771
training loss: 0.05395630747079849 

Epoch 10, batch 1772
training loss: 0.6328604817390442 

Epoch 10, batch 1773
training loss: 0.05523676797747612 

Epoch 10, batch 1774
training loss: 0.01264632772654295 

Epoch 10, batch 1775
training loss: 0.04380274564027786 

Epoch 10, batch 1776
training loss: 0.09845846891403198 

Epoch 10, batch 1777
training loss: 0.0024073487147688866 

Epoch 10, batch 1778
training loss: 0.009076239541172981 

Epoch 10, batch 1779
training loss: 0.029557684436440468 

Epoch 10, batch 1780
training loss: 0.6563084721565247 

Epoch 10, batch 1781
training loss: 0.10165431350469589 

Epoch 10, batch 1782
training loss: 0.012559126131236553 

Epoch 10

Epoch 10, batch 1979
training loss: 0.022306106984615326 

Epoch 10, batch 1980
training loss: 0.3597193658351898 

Epoch 10, batch 1981
training loss: 0.8331102132797241 

Epoch 10, batch 1982
training loss: 0.09096948802471161 

Epoch 10, batch 1983
training loss: 0.01054296363145113 

Epoch 10, batch 1984
training loss: 0.20331287384033203 

Epoch 10, batch 1985
training loss: 0.05541254207491875 

Epoch 10, batch 1986
training loss: 0.25481313467025757 

Epoch 10, batch 1987
training loss: 0.2004869431257248 

Epoch 10, batch 1988
training loss: 0.04110623151063919 

Epoch 10, batch 1989
training loss: 0.16383865475654602 

Epoch 10, batch 1990
training loss: 0.008843431249260902 

Epoch 10, batch 1991
training loss: 0.060879092663526535 

Epoch 10, batch 1992
training loss: 0.013076407834887505 

Epoch 10, batch 1993
training loss: 0.007689435034990311 

Epoch 10, batch 1994
training loss: 0.027580389752984047 

Epoch 10, batch 1995
training loss: 0.2690969407558441 

Epoch 10, ba

Epoch 10, batch 2198
training loss: 0.19874827563762665 

Epoch 10, batch 2199
training loss: 0.0032839581836014986 

Epoch 10, batch 2200
training loss: 0.005349600221961737 

Epoch 10, batch 2201
training loss: 0.01569782756268978 

Epoch 10, batch 2202
training loss: 0.013531342148780823 

Epoch 10, batch 2203
training loss: 0.11249657720327377 

Epoch 10, batch 2204
training loss: 0.018398767337203026 

Epoch 10, batch 2205
training loss: 0.024886399507522583 

Epoch 10, batch 2206
training loss: 0.007791283540427685 

Epoch 10, batch 2207
training loss: 0.02460591122508049 

Epoch 10, batch 2208
training loss: 0.3925972580909729 

Epoch 10, batch 2209
training loss: 0.061821967363357544 

Epoch 10, batch 2210
training loss: 0.09891010820865631 

Epoch 10, batch 2211
training loss: 0.030419597402215004 

Epoch 10, batch 2212
training loss: 0.14899295568466187 

Epoch 10, batch 2213
training loss: 0.02363092079758644 

Epoch 10, batch 2214
training loss: 0.03144528344273567 

Epoch 

Epoch 10, batch 2418
training loss: 0.07263055443763733 

Epoch 10, batch 2419
training loss: 0.19734525680541992 

Epoch 10, batch 2420
training loss: 0.031793832778930664 

Epoch 10, batch 2421
training loss: 0.04107203334569931 

Epoch 10, batch 2422
training loss: 0.02027195319533348 

Epoch 10, batch 2423
training loss: 0.004248192999511957 

Epoch 10, batch 2424
training loss: 0.1123473197221756 

Epoch 10, batch 2425
training loss: 0.15054239332675934 

Epoch 10, batch 2426
training loss: 0.02107315883040428 

Epoch 10, batch 2427
training loss: 0.009360276162624359 

Epoch 10, batch 2428
training loss: 0.12972542643547058 

Epoch 10, batch 2429
training loss: 0.21827013790607452 

Epoch 10, batch 2430
training loss: 0.5066702961921692 

Epoch 10, batch 2431
training loss: 0.09259192645549774 

Epoch 10, batch 2432
training loss: 0.056500811129808426 

Epoch 10, batch 2433
training loss: 0.09691757708787918 

Epoch 10, batch 2434
training loss: 0.009701890870928764 

Epoch 10, b

Epoch 10, batch 2634
training loss: 0.4119602143764496 

Epoch 10, batch 2635
training loss: 0.040277086198329926 

Epoch 10, batch 2636
training loss: 0.008407571353018284 

Epoch 10, batch 2637
training loss: 0.03497889265418053 

Epoch 10, batch 2638
training loss: 0.004289468750357628 

Epoch 10, batch 2639
training loss: 0.011779803782701492 

Epoch 10, batch 2640
training loss: 0.12408248335123062 

Epoch 10, batch 2641
training loss: 0.07298271358013153 

Epoch 10, batch 2642
training loss: 0.02914750948548317 

Epoch 10, batch 2643
training loss: 0.0051187933422625065 

Epoch 10, batch 2644
training loss: 0.006675553973764181 

Epoch 10, batch 2645
training loss: 0.07234184443950653 

Epoch 10, batch 2646
training loss: 0.010443917475640774 

Epoch 10, batch 2647
training loss: 0.09248755872249603 

Epoch 10, batch 2648
training loss: 0.018148431554436684 

Epoch 10, batch 2649
training loss: 0.2194625586271286 

Epoch 10, batch 2650
training loss: 0.012116050347685814 

Epoch 

Epoch 10, batch 2851
training loss: 0.4858309328556061 

Epoch 10, batch 2852
training loss: 0.747343122959137 

Epoch 10, batch 2853
training loss: 0.3033188581466675 

Epoch 10, batch 2854
training loss: 0.09767962992191315 

Epoch 10, batch 2855
training loss: 0.020857691764831543 

Epoch 10, batch 2856
training loss: 0.024367287755012512 

Epoch 10, batch 2857
training loss: 0.13702143728733063 

Epoch 10, batch 2858
training loss: 0.6200231313705444 

Epoch 10, batch 2859
training loss: 0.2563660740852356 

Epoch 10, batch 2860
training loss: 0.008375449106097221 

Epoch 10, batch 2861
training loss: 0.29764309525489807 

Epoch 10, batch 2862
training loss: 0.052016206085681915 

Epoch 10, batch 2863
training loss: 0.7432516813278198 

Epoch 10, batch 2864
training loss: 0.011129060760140419 

Epoch 10, batch 2865
training loss: 0.16377030313014984 

Epoch 10, batch 2866
training loss: 0.018192579969763756 

Epoch 10, batch 2867
training loss: 0.020520437508821487 

Epoch 10, batc

Epoch 10, batch 3073
training loss: 0.21818354725837708 

Epoch 10, batch 3074
training loss: 0.00651902798563242 

Epoch 10, batch 3075
training loss: 0.0040693096816539764 

Epoch 10, batch 3076
training loss: 0.03643433749675751 

Epoch 10, batch 3077
training loss: 0.012856224551796913 

Epoch 10, batch 3078
training loss: 0.022340521216392517 

Epoch 10, batch 3079
training loss: 0.024789558723568916 

Epoch 10, batch 3080
training loss: 0.01606190949678421 

Epoch 10, batch 3081
training loss: 0.1285773366689682 

Epoch 10, batch 3082
training loss: 0.01189226470887661 

Epoch 10, batch 3083
training loss: 0.21694543957710266 

Epoch 10, batch 3084
training loss: 0.022084418684244156 

Epoch 10, batch 3085
training loss: 0.15371033549308777 

Epoch 10, batch 3086
training loss: 0.013602753169834614 

Epoch 10, batch 3087
training loss: 0.03393571078777313 

Epoch 10, batch 3088
training loss: 0.14557340741157532 

Epoch 10, batch 3089
training loss: 0.040009066462516785 

Epoch 1

Epoch 10, batch 3298
training loss: 0.006078606937080622 

Epoch 10, batch 3299
training loss: 0.028811339288949966 

Epoch 10, batch 3300
training loss: 0.01583951525390148 

Epoch 10, batch 3301
training loss: 0.0045923045836389065 

Epoch 10, batch 3302
training loss: 0.06855268031358719 

Epoch 10, batch 3303
training loss: 0.3382335305213928 

Epoch 10, batch 3304
training loss: 0.09379666298627853 

Epoch 10, batch 3305
training loss: 0.23822753131389618 

Epoch 10, batch 3306
training loss: 0.06258437037467957 

Epoch 10, batch 3307
training loss: 0.022639606148004532 

Epoch 10, batch 3308
training loss: 0.10434259474277496 

Epoch 10, batch 3309
training loss: 0.008658485487103462 

Epoch 10, batch 3310
training loss: 0.005421909503638744 

Epoch 10, batch 3311
training loss: 0.042617715895175934 

Epoch 10, batch 3312
training loss: 0.26620766520500183 

Epoch 10, batch 3313
training loss: 0.10904457420110703 

Epoch 10, batch 3314
training loss: 0.012963141314685345 

Epoch 

Epoch 10, batch 3523
training loss: 0.058046381920576096 

Epoch 10, batch 3524
training loss: 0.1378551423549652 

Epoch 10, batch 3525
training loss: 0.5096501111984253 

Epoch 10, batch 3526
training loss: 0.180332213640213 

Epoch 10, batch 3527
training loss: 0.006681571248918772 

Epoch 10, batch 3528
training loss: 0.0918491929769516 

Epoch 10, batch 3529
training loss: 0.01899312250316143 

Epoch 10, batch 3530
training loss: 0.0046373941004276276 

Epoch 10, batch 3531
training loss: 0.09333029389381409 

Epoch 10, batch 3532
training loss: 0.09654758870601654 

Epoch 10, batch 3533
training loss: 0.010452214628458023 

Epoch 10, batch 3534
training loss: 0.1915838122367859 

Epoch 10, batch 3535
training loss: 0.008730193600058556 

Epoch 10, batch 3536
training loss: 0.06756912916898727 

Epoch 10, batch 3537
training loss: 0.08104528486728668 

Epoch 10, batch 3538
training loss: 0.018110137432813644 

Epoch 10, batch 3539
training loss: 0.07369251549243927 

Epoch 10, bat

Epoch 10, batch 3745
training loss: 0.11921001970767975 

Epoch 10, batch 3746
training loss: 0.1287010908126831 

Epoch 10, batch 3747
training loss: 0.07444505393505096 

Epoch 10, batch 3748
training loss: 0.047935061156749725 

Epoch 10, batch 3749
training loss: 0.10162851959466934 

Epoch 10, batch 3750
training loss: 0.08421184122562408 

Epoch 10, batch 3751
training loss: 0.41870737075805664 

Epoch 10, batch 3752
training loss: 0.03139404207468033 

Epoch 10, batch 3753
training loss: 0.09380575269460678 

Epoch 10, batch 3754
training loss: 0.009241851046681404 

Epoch 10, batch 3755
training loss: 0.16825972497463226 

Epoch 10, batch 3756
training loss: 0.10447248071432114 

Epoch 10, batch 3757
training loss: 0.019641544669866562 

Epoch 10, batch 3758
training loss: 0.030243556946516037 

Epoch 10, batch 3759
training loss: 0.002972081769257784 

Epoch 10, batch 3760
training loss: 0.030330747365951538 

Epoch 10, batch 3761
training loss: 0.1126473993062973 

Epoch 10, 

Epoch 10, batch 3970
training loss: 0.008492517285048962 

Epoch 10, batch 3971
training loss: 0.8058620691299438 

Epoch 10, batch 3972
training loss: 0.0392608568072319 

Epoch 10, batch 3973
training loss: 0.18267814815044403 

Epoch 10, batch 3974
training loss: 0.0021725809201598167 

Epoch 10, batch 3975
training loss: 0.023735489696264267 

Epoch 10, batch 3976
training loss: 0.30202093720436096 

Epoch 10, batch 3977
training loss: 0.0060326093807816505 

Epoch 10, batch 3978
training loss: 0.03227964788675308 

Epoch 10, batch 3979
training loss: 0.23275122046470642 

Epoch 10, batch 3980
training loss: 0.00783831812441349 

Epoch 10, batch 3981
training loss: 0.29227036237716675 

Epoch 10, batch 3982
training loss: 0.12926419079303741 

Epoch 10, batch 3983
training loss: 0.328634113073349 

Epoch 10, batch 3984
training loss: 0.017038492485880852 

Epoch 10, batch 3985
training loss: 0.3038250803947449 

Epoch 10, batch 3986
training loss: 0.024151431396603584 

Epoch 10, b

Epoch 10, batch 4196
training loss: 0.1592298001050949 

Epoch 10, batch 4197
training loss: 0.7709307074546814 

Epoch 10, batch 4198
training loss: 0.01270351093262434 

Epoch 10, batch 4199
training loss: 0.062018923461437225 

Epoch 10, batch 4200
training loss: 0.04215376079082489 

Epoch 10, batch 4201
training loss: 0.024684593081474304 

Epoch 10, batch 4202
training loss: 0.6435695290565491 

Epoch 10, batch 4203
training loss: 0.03317985683679581 

Epoch 10, batch 4204
training loss: 0.02093033865094185 

Epoch 10, batch 4205
training loss: 0.20935019850730896 

Epoch 10, batch 4206
training loss: 0.03589282184839249 

Epoch 10, batch 4207
training loss: 0.2174038589000702 

Epoch 10, batch 4208
training loss: 0.005419283639639616 

Epoch 10, batch 4209
training loss: 0.0023678201250731945 

Epoch 10, batch 4210
training loss: 0.05348880961537361 

Epoch 10, batch 4211
training loss: 0.012434253469109535 

Epoch 10, batch 4212
training loss: 0.007213742472231388 

Epoch 10, b

Epoch 10, batch 4422
training loss: 0.12062293291091919 

Epoch 10, batch 4423
training loss: 0.10838960111141205 

Epoch 10, batch 4424
training loss: 0.035968754440546036 

Epoch 10, batch 4425
training loss: 0.1319907307624817 

Epoch 10, batch 4426
training loss: 0.014510194770991802 

Epoch 10, batch 4427
training loss: 0.025439638644456863 

Epoch 10, batch 4428
training loss: 0.13443878293037415 

Epoch 10, batch 4429
training loss: 0.02964203618466854 

Epoch 10, batch 4430
training loss: 0.027314523234963417 

Epoch 10, batch 4431
training loss: 0.030780375003814697 

Epoch 10, batch 4432
training loss: 0.12564754486083984 

Epoch 10, batch 4433
training loss: 0.006348565220832825 

Epoch 10, batch 4434
training loss: 0.046387817710638046 

Epoch 10, batch 4435
training loss: 0.01662970334291458 

Epoch 10, batch 4436
training loss: 0.15763242542743683 

Epoch 10, batch 4437
training loss: 0.03883387893438339 

Epoch 10, batch 4438
training loss: 0.29350247979164124 

Epoch 10

Epoch 10, batch 4639
training loss: 0.05219195410609245 

Epoch 10, batch 4640
training loss: 0.01663276180624962 

Epoch 10, batch 4641
training loss: 0.0955076813697815 

Epoch 10, batch 4642
training loss: 0.04044591262936592 

Epoch 10, batch 4643
training loss: 0.015425602905452251 

Epoch 10, batch 4644
training loss: 0.09738896787166595 

Epoch 10, batch 4645
training loss: 0.012291916646063328 

Epoch 10, batch 4646
training loss: 0.005543042905628681 

Epoch 10, batch 4647
training loss: 0.047369249165058136 

Epoch 10, batch 4648
training loss: 0.04654798284173012 

Epoch 10, batch 4649
training loss: 0.24666814506053925 

Epoch 10, batch 4650
training loss: 0.0025127865374088287 

Epoch 10, batch 4651
training loss: 0.038701131939888 

Epoch 10, batch 4652
training loss: 0.015744024887681007 

Epoch 10, batch 4653
training loss: 0.3629201650619507 

Epoch 10, batch 4654
training loss: 0.007670844439417124 

Epoch 10, batch 4655
training loss: 0.01348658837378025 

Epoch 10, 

Epoch 10, batch 4858
training loss: 0.35737285017967224 

Epoch 10, batch 4859
training loss: 0.043107397854328156 

Epoch 10, batch 4860
training loss: 0.5754503011703491 

Epoch 10, batch 4861
training loss: 0.036674126982688904 

Epoch 10, batch 4862
training loss: 0.005252066068351269 

Epoch 10, batch 4863
training loss: 0.007575713098049164 

Epoch 10, batch 4864
training loss: 0.05024982616305351 

Epoch 10, batch 4865
training loss: 0.6133497953414917 

Epoch 10, batch 4866
training loss: 0.13133546710014343 

Epoch 10, batch 4867
training loss: 0.4279659688472748 

Epoch 10, batch 4868
training loss: 0.18979927897453308 

Epoch 10, batch 4869
training loss: 0.01037059910595417 

Epoch 10, batch 4870
training loss: 0.024738619104027748 

Epoch 10, batch 4871
training loss: 0.005212593358010054 

Epoch 10, batch 4872
training loss: 0.39897072315216064 

Epoch 10, batch 4873
training loss: 0.01125444658100605 

Epoch 10, batch 4874
training loss: 0.17696617543697357 

Epoch 10, b

Epoch 10, batch 5074
training loss: 0.0030695763416588306 

Epoch 10, batch 5075
training loss: 0.03604178503155708 

Epoch 10, batch 5076
training loss: 0.04377087205648422 

Epoch 10, batch 5077
training loss: 0.004244149196892977 

Epoch 10, batch 5078
training loss: 0.0015014868695288897 

Epoch 10, batch 5079
training loss: 0.4235685467720032 

Epoch 10, batch 5080
training loss: 0.03519805520772934 

Epoch 10, batch 5081
training loss: 0.010913265869021416 

Epoch 10, batch 5082
training loss: 0.005104199983179569 

Epoch 10, batch 5083
training loss: 0.03598051518201828 

Epoch 10, batch 5084
training loss: 0.30639931559562683 

Epoch 10, batch 5085
training loss: 0.07218387722969055 

Epoch 10, batch 5086
training loss: 0.021989893168210983 

Epoch 10, batch 5087
training loss: 0.6993380784988403 

Epoch 10, batch 5088
training loss: 0.055031925439834595 

Epoch 10, batch 5089
training loss: 0.3524378836154938 

Epoch 10, batch 5090
training loss: 0.03903677314519882 

Epoch 10

Epoch 10, batch 5279
training loss: 0.03972681239247322 

Epoch 10, batch 5280
training loss: 0.06156370788812637 

Epoch 10, batch 5281
training loss: 0.005381846334785223 

Epoch 10, batch 5282
training loss: 0.12459834665060043 

Epoch 10, batch 5283
training loss: 0.009229034185409546 

Epoch 10, batch 5284
training loss: 0.07433050870895386 

Epoch 10, batch 5285
training loss: 0.14629067480564117 

Epoch 10, batch 5286
training loss: 0.022284839302301407 

Epoch 10, batch 5287
training loss: 0.08055723458528519 

Epoch 10, batch 5288
training loss: 0.024544568732380867 

Epoch 10, batch 5289
training loss: 0.01460225135087967 

Epoch 10, batch 5290
training loss: 0.695652425289154 

Epoch 10, batch 5291
training loss: 0.017695780843496323 

Epoch 10, batch 5292
training loss: 0.9325550198554993 

Epoch 10, batch 5293
training loss: 0.18832698464393616 

Epoch 10, batch 5294
training loss: 0.5344575643539429 

Epoch 10, batch 5295
training loss: 0.7154471278190613 

Epoch 10, batc

Epoch 10, batch 5499
training loss: 0.06748189777135849 

Epoch 10, batch 5500
training loss: 0.12090200185775757 

Epoch 10, batch 5501
training loss: 0.009155086241662502 

Epoch 10, batch 5502
training loss: 0.0015208396362140775 

Epoch 10, batch 5503
training loss: 0.04406416416168213 

Epoch 10, batch 5504
training loss: 0.03778504207730293 

Epoch 10, batch 5505
training loss: 0.00691188732162118 

Epoch 10, batch 5506
training loss: 0.1874304711818695 

Epoch 10, batch 5507
training loss: 0.004771158564835787 

Epoch 10, batch 5508
training loss: 0.15694797039031982 

Epoch 10, batch 5509
training loss: 0.003163248999044299 

Epoch 10, batch 5510
training loss: 0.7142764329910278 

Epoch 10, batch 5511
training loss: 0.305085688829422 

Epoch 10, batch 5512
training loss: 0.003789375303313136 

Epoch 10, batch 5513
training loss: 0.007867975160479546 

Epoch 10, batch 5514
training loss: 0.008625623770058155 

Epoch 10, batch 5515
training loss: 0.1776919960975647 

Epoch 10, b

Epoch 10, batch 5718
training loss: 0.014170488342642784 

Epoch 10, batch 5719
training loss: 0.03437361866235733 

Epoch 10, batch 5720
training loss: 0.026579609140753746 

Epoch 10, batch 5721
training loss: 0.061947762966156006 

Epoch 10, batch 5722
training loss: 0.027497131377458572 

Epoch 10, batch 5723
training loss: 0.007967429235577583 

Epoch 10, batch 5724
training loss: 0.15178218483924866 

Epoch 10, batch 5725
training loss: 0.08484599739313126 

Epoch 10, batch 5726
training loss: 0.03625309094786644 

Epoch 10, batch 5727
training loss: 0.003516852157190442 

Epoch 10, batch 5728
training loss: 0.0038017493207007647 

Epoch 10, batch 5729
training loss: 0.4544835090637207 

Epoch 10, batch 5730
training loss: 0.012511332519352436 

Epoch 10, batch 5731
training loss: 0.3888254761695862 

Epoch 10, batch 5732
training loss: 0.08151806890964508 

Epoch 10, batch 5733
training loss: 0.16044725477695465 

Epoch 10, batch 5734
training loss: 0.006793519947677851 

Epoch 

Epoch 10, batch 5936
training loss: 0.7681864500045776 

Epoch 10, batch 5937
training loss: 0.011287437751889229 

Epoch 10, batch 5938
training loss: 0.16158144176006317 

Epoch 10, batch 5939
training loss: 0.0766485333442688 

Epoch 10, batch 5940
training loss: 0.09469076246023178 

Epoch 10, batch 5941
training loss: 0.1386057436466217 

Epoch 10, batch 5942
training loss: 0.008369168266654015 

Epoch 10, batch 5943
training loss: 0.09333322942256927 

Epoch 10, batch 5944
training loss: 0.10118237882852554 

Epoch 10, batch 5945
training loss: 0.010359447449445724 

Epoch 10, batch 5946
training loss: 0.054045505821704865 

Epoch 10, batch 5947
training loss: 0.1749398410320282 

Epoch 10, batch 5948
training loss: 0.1090371236205101 

Epoch 10, batch 5949
training loss: 0.03610512614250183 

Epoch 10, batch 5950
training loss: 0.011905076913535595 

Epoch 10, batch 5951
training loss: 0.011995651759207249 

Epoch 10, batch 5952
training loss: 0.1737779676914215 

Epoch 10, batc

In [47]:
def eval_model(model, test_data):
    test_loader = DataLoader(test_data, batch_size=10, shuffle=True)
    correct = 0
    total = 0
    with torch.no_grad():
        for data in test_loader:
            x, y = data
            output = model(x.view(-1, 784))
            for idx, i in enumerate(output):
                if torch.argmax(i) == y[idx]:
                    correct += 1
                total += 1
    print(f'accuracy: {correct/total}')

eval_model(model, mnist_test)

accuracy: 0.9619
