In [1]:
import torch
from model import *
import numpy as np
import os
import random
import torch.optim as optim
import torch.nn as nn
from Myloader import *
import time
import torchvision.models as models
from torchmetrics.classification import MultilabelAveragePrecision



In [2]:
def set_seed(seed):
    torch.manual_seed(seed)
    torch.cuda.manual_seed(seed)
    torch.cuda.manual_seed_all(seed)
    np.random.seed(seed)
    random.seed(seed)
    torch.backends.cudnn.benchmark = False
    torch.backends.cudnn.deterministic = True


def evaluate(model, val_loader):
    model.eval()
    test_running_loss = 0.0
    test_total = 0

    with torch.no_grad():
        record_target_label = torch.zeros(1, 19).to(device)
        record_predict_label = torch.zeros(1, 19).to(device)
        for (test_imgs, test_labels, test_dicoms) in val_loader:
            test_imgs = test_imgs.to(device)
            test_labels = test_labels.to(device)
            test_labels = test_labels.squeeze(-1)

            test_output = model(test_imgs)
            loss = criterion(test_output, test_labels)

            test_running_loss += loss.item() * test_imgs.size(0)
            test_total += test_imgs.size(0)

            record_target_label = torch.cat((record_target_label, test_labels), 0)
            record_predict_label = torch.cat((record_predict_label, test_output), 0)


        record_target_label = record_target_label[1::]
        record_predict_label = record_predict_label[1::]

        metric = MultilabelAveragePrecision(num_labels=19, average="macro", thresholds=None)
        mAP = metric(record_predict_label, record_target_label.to(torch.int32))

    return mAP, test_running_loss, test_total

In [3]:
set_seed(123)
#     weight_dir = ""
#     if not os.path.exists(weight_dir):
#         os.makedirs(weight_dir)

epochs = 100
batch_size = 32
num_classes = 19

weight_path = "weights/"

train_path = "data/MICCAI_long_tail_train.tfrecords"
train_index = "data/MICCAI_long_tail_train.tfindex"
val_path = "data/MICCAI_long_tail_val.tfrecords"
val_index = "data/MICCAI_long_tail_val.tfindex"
opt_lr = 1e-4
weight_decay = 0
training = True
train_name = ""
val_name = ""

In [4]:
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
print(device)
encoder = ResnetEncoder(num_layers=18, embDimension=num_classes).to(device)
opt = optim.Adam(encoder.parameters(), lr=opt_lr, weight_decay = weight_decay)
train_loader = Myloader(train_path, train_index, batch_size, num_workers=0, shuffle=True)
val_loader = Myloader(val_path, val_index, batch_size, num_workers=0, shuffle=False)

criterion = nn.BCEWithLogitsLoss()

cuda




In [14]:
print(mAP, test_running_loss, test_total )

tensor(0.1372, device='cuda:0') 15696.87715625763 20360


In [12]:
# torch.save({
#       'model_state_dict': encoder.state_dict(),
#       'optimizer_state_dict': opt.state_dict(),
#   }, weight_path+'/test.pt')

In [13]:
# checkpoint = torch.load(weight_path+'/test.pt')
# encoder.load_state_dict(checkpoint['model_state_dict'])
# opt.load_state_dict(checkpoint['optimizer_state_dict'])

In [None]:
# mAP, test_running_loss, test_total = evaluate(encoder, val_loader)

In [None]:
train_losses = []
test_losses = []

if training == True:
#         wandb.init(
#             project='chexpert mitigate bias',
#             name= train_wandb_name)
#         config = wandb.config
#         config.batch_size = batch_size
    max_map = 0
    total = 0
    scaler = torch.cuda.amp.GradScaler()

    for epoch in range(epochs):
        encoder.train()
        running_loss = 0.0
        start_time = time.time()
        count = 0

        for (imgs, labels, dicom_ids) in train_loader:
            encoder.zero_grad()
            opt.zero_grad()

            imgs = imgs.to(device)
            labels = labels.to(device)
            labels = labels.squeeze(-1)

            with torch.autocast(device_type='cuda', dtype=torch.float16):
                output = encoder(imgs)
                loss = criterion(output, labels)

            scaler.scale(loss).backward()
            scaler.step(opt)
            scaler.update()

            running_loss += loss.item() * imgs.size(0)
            count += imgs.size(0)

            if count != 0 and count % 1024 == 0 and total == 0:
                print(f"epoch {epoch}: {count}/unknown finished / train loss: {running_loss / count}")

            elif count != 0 and count % 10 == 0 and total != 0:
                print(f"epoch {epoch}: {count}/{total} (%.2f %%) finished / train loss: {running_loss / count}" % (count/total))

        total = count
        mAP, test_running_loss, test_total = evaluate(encoder, val_loader)
        
        train_losses.append(running_loss / count)
        test_losses.append(test_running_loss)
        
        if mAP > max_map:
            max_map = mAP
            torch.save({
                'model_state_dict': encoder.state_dict(),
                'optimizer_state_dict': opt.state_dict(),
            }, f"{weight_path}/model_best.pt")
        if epoch % 10 == 0:
            torch.save({
                    'model_state_dict': encoder.state_dict(),
                    'optimizer_state_dict': opt.state_dict(),
                }, weight_path+"/{}epoch.pt".format(epoch))

        end_time = time.time()
        duration = end_time - start_time

        print(f"epoch {epoch} / mAP: {mAP} / test loss: {test_running_loss / test_total} / duration: {duration}")





epoch 0: 1024/unknown finished / train loss: 0.4247866189107299
epoch 0: 2048/unknown finished / train loss: 0.3762495471164584
epoch 0: 3072/unknown finished / train loss: 0.35491527151316404
epoch 0: 4096/unknown finished / train loss: 0.33879745670128614
epoch 0: 5120/unknown finished / train loss: 0.33022431591525675
epoch 0: 6144/unknown finished / train loss: 0.3233362406026572
epoch 0: 7168/unknown finished / train loss: 0.31730631313153673
epoch 0: 8192/unknown finished / train loss: 0.31565669167321175
epoch 0: 9216/unknown finished / train loss: 0.3123269284971886
epoch 0: 10240/unknown finished / train loss: 0.30940602710470555
epoch 0: 11264/unknown finished / train loss: 0.3064982090992006
epoch 0: 12288/unknown finished / train loss: 0.3036631285212934
epoch 0: 13312/unknown finished / train loss: 0.3020171134446103
epoch 0: 14336/unknown finished / train loss: 0.3010796048744981
epoch 0: 15360/unknown finished / train loss: 0.29958329017584523
epoch 0: 16384/unknown fini

epoch 0: 130048/unknown finished / train loss: 0.2715492548795021
epoch 0: 131072/unknown finished / train loss: 0.27148861339810537
epoch 0: 132096/unknown finished / train loss: 0.2714036445371633
epoch 0: 133120/unknown finished / train loss: 0.2712982663311637
epoch 0: 134144/unknown finished / train loss: 0.2711914220668432
epoch 0: 135168/unknown finished / train loss: 0.27103271583363303
epoch 0: 136192/unknown finished / train loss: 0.27095147131949215
epoch 0: 137216/unknown finished / train loss: 0.27087222996737753
epoch 0: 138240/unknown finished / train loss: 0.2708004722923592
epoch 0: 139264/unknown finished / train loss: 0.2706820242901278
epoch 0: 140288/unknown finished / train loss: 0.27056988930995884
epoch 0: 141312/unknown finished / train loss: 0.2705553954001516
epoch 0: 142336/unknown finished / train loss: 0.2703719040204724
epoch 0: 143360/unknown finished / train loss: 0.2703205941777144
epoch 0: 144384/unknown finished / train loss: 0.2702637107527636
epoch

epoch 1: 10560/182380 (0.06 %) finished / train loss: 0.25299369101271485
epoch 1: 10720/182380 (0.06 %) finished / train loss: 0.25291595948276235
epoch 1: 10880/182380 (0.06 %) finished / train loss: 0.25319539532065394
epoch 1: 11040/182380 (0.06 %) finished / train loss: 0.25339888312678405
epoch 1: 11200/182380 (0.06 %) finished / train loss: 0.2533008699331965
epoch 1: 11360/182380 (0.06 %) finished / train loss: 0.25360792619241795
epoch 1: 11520/182380 (0.06 %) finished / train loss: 0.253476236305303
epoch 1: 11680/182380 (0.06 %) finished / train loss: 0.2531330308685564
epoch 1: 11840/182380 (0.06 %) finished / train loss: 0.2531447030402519
epoch 1: 12000/182380 (0.07 %) finished / train loss: 0.2534269363085429
epoch 1: 12160/182380 (0.07 %) finished / train loss: 0.25442318273218056
epoch 1: 12320/182380 (0.07 %) finished / train loss: 0.2545434364250728
epoch 1: 12480/182380 (0.07 %) finished / train loss: 0.2542610392738611
epoch 1: 12640/182380 (0.07 %) finished / trai

epoch 1: 28480/182380 (0.16 %) finished / train loss: 0.2531714089968231
epoch 1: 28640/182380 (0.16 %) finished / train loss: 0.2531430857308084
epoch 1: 28800/182380 (0.16 %) finished / train loss: 0.2530301529169083
epoch 1: 28960/182380 (0.16 %) finished / train loss: 0.25299567626326125
epoch 1: 29120/182380 (0.16 %) finished / train loss: 0.25293255474541215
epoch 1: 29280/182380 (0.16 %) finished / train loss: 0.25293316618015205
epoch 1: 29440/182380 (0.16 %) finished / train loss: 0.25293214628877847
epoch 1: 29600/182380 (0.16 %) finished / train loss: 0.2530569740404954
epoch 1: 29760/182380 (0.16 %) finished / train loss: 0.2530160129230509
epoch 1: 29920/182380 (0.16 %) finished / train loss: 0.2530734807252884
epoch 1: 30080/182380 (0.16 %) finished / train loss: 0.2529442678423638
epoch 1: 30240/182380 (0.17 %) finished / train loss: 0.2528120963031022
epoch 1: 30400/182380 (0.17 %) finished / train loss: 0.25285821161772076
epoch 1: 30560/182380 (0.17 %) finished / trai

epoch 1: 46400/182380 (0.25 %) finished / train loss: 0.25507137130046714
epoch 1: 46560/182380 (0.26 %) finished / train loss: 0.25508938521863667
epoch 1: 46720/182380 (0.26 %) finished / train loss: 0.25526771749535654
epoch 1: 46880/182380 (0.26 %) finished / train loss: 0.25524086026608334
epoch 1: 47040/182380 (0.26 %) finished / train loss: 0.25529458077789163
epoch 1: 47200/182380 (0.26 %) finished / train loss: 0.2552527332406933
epoch 1: 47360/182380 (0.26 %) finished / train loss: 0.25529573817510864
epoch 1: 47520/182380 (0.26 %) finished / train loss: 0.25541348090075483
epoch 1: 47680/182380 (0.26 %) finished / train loss: 0.25539774791706327
epoch 1: 47840/182380 (0.26 %) finished / train loss: 0.2553746496853621
epoch 1: 48000/182380 (0.26 %) finished / train loss: 0.25548962427179017
epoch 1: 48160/182380 (0.26 %) finished / train loss: 0.25542291967179687
epoch 1: 48320/182380 (0.26 %) finished / train loss: 0.25536423820928233
epoch 1: 48480/182380 (0.27 %) finished 

epoch 1: 64320/182380 (0.35 %) finished / train loss: 0.255277173895741
epoch 1: 64480/182380 (0.35 %) finished / train loss: 0.2552886567843463
epoch 1: 64640/182380 (0.35 %) finished / train loss: 0.2552622560153503
epoch 1: 64800/182380 (0.36 %) finished / train loss: 0.25526716943876243
epoch 1: 64960/182380 (0.36 %) finished / train loss: 0.25534087109741904
epoch 1: 65120/182380 (0.36 %) finished / train loss: 0.2552957814580393
epoch 1: 65280/182380 (0.36 %) finished / train loss: 0.2552980955251876
epoch 1: 65440/182380 (0.36 %) finished / train loss: 0.25524983413353525
epoch 1: 65600/182380 (0.36 %) finished / train loss: 0.2552879200475972
epoch 1: 65760/182380 (0.36 %) finished / train loss: 0.25526408318910576
epoch 1: 65920/182380 (0.36 %) finished / train loss: 0.2552776957816869
epoch 1: 66080/182380 (0.36 %) finished / train loss: 0.2552152980254291
epoch 1: 66240/182380 (0.36 %) finished / train loss: 0.25524518041363087
epoch 1: 66400/182380 (0.36 %) finished / train

epoch 1: 82240/182380 (0.45 %) finished / train loss: 0.2554177634099114
epoch 1: 82400/182380 (0.45 %) finished / train loss: 0.25540745188888997
epoch 1: 82560/182380 (0.45 %) finished / train loss: 0.2553944443258666
epoch 1: 82720/182380 (0.45 %) finished / train loss: 0.2554919166133759
epoch 1: 82880/182380 (0.45 %) finished / train loss: 0.2555210481164078
epoch 1: 83040/182380 (0.46 %) finished / train loss: 0.2554832432311394
epoch 1: 83200/182380 (0.46 %) finished / train loss: 0.2554943665632835
epoch 1: 83360/182380 (0.46 %) finished / train loss: 0.2554889375669256
epoch 1: 83520/182380 (0.46 %) finished / train loss: 0.2554721478358539
epoch 1: 83680/182380 (0.46 %) finished / train loss: 0.255467952585585
epoch 1: 83840/182380 (0.46 %) finished / train loss: 0.2554929092753935
epoch 1: 84000/182380 (0.46 %) finished / train loss: 0.2555328225635347
epoch 1: 84160/182380 (0.46 %) finished / train loss: 0.2555464486885433
epoch 1: 84320/182380 (0.46 %) finished / train los

epoch 1: 100160/182380 (0.55 %) finished / train loss: 0.25499717170914143
epoch 1: 100320/182380 (0.55 %) finished / train loss: 0.2549244970415958
epoch 1: 100480/182380 (0.55 %) finished / train loss: 0.25488766983720906
epoch 1: 100640/182380 (0.55 %) finished / train loss: 0.254836071314607
epoch 1: 100800/182380 (0.55 %) finished / train loss: 0.2548176079610037
epoch 1: 100960/182380 (0.55 %) finished / train loss: 0.25481173650681876
epoch 1: 101120/182380 (0.55 %) finished / train loss: 0.25478413612404954
epoch 1: 101280/182380 (0.56 %) finished / train loss: 0.2548011770886833
epoch 1: 101440/182380 (0.56 %) finished / train loss: 0.254828141672002
epoch 1: 101600/182380 (0.56 %) finished / train loss: 0.25480461135154636
epoch 1: 101760/182380 (0.56 %) finished / train loss: 0.2548083264497841
epoch 1: 101920/182380 (0.56 %) finished / train loss: 0.2548206358680171
epoch 1: 102080/182380 (0.56 %) finished / train loss: 0.25491105510990447
epoch 1: 102240/182380 (0.56 %) fi

epoch 1: 117920/182380 (0.65 %) finished / train loss: 0.2546965151216476
epoch 1: 118080/182380 (0.65 %) finished / train loss: 0.2546957338284348
epoch 1: 118240/182380 (0.65 %) finished / train loss: 0.2547115948509944
epoch 1: 118400/182380 (0.65 %) finished / train loss: 0.2547067504557403
epoch 1: 118560/182380 (0.65 %) finished / train loss: 0.25474842913478973
epoch 1: 118720/182380 (0.65 %) finished / train loss: 0.2547159227118338
epoch 1: 118880/182380 (0.65 %) finished / train loss: 0.2547097805210591
epoch 1: 119040/182380 (0.65 %) finished / train loss: 0.25471148556198486
epoch 1: 119200/182380 (0.65 %) finished / train loss: 0.2547363423461082
epoch 1: 119360/182380 (0.65 %) finished / train loss: 0.254764222695265
epoch 1: 119520/182380 (0.66 %) finished / train loss: 0.2547628147734536
epoch 1: 119680/182380 (0.66 %) finished / train loss: 0.25477915828957914
epoch 1: 119840/182380 (0.66 %) finished / train loss: 0.25476465433716616
epoch 1: 120000/182380 (0.66 %) fin

epoch 1: 135680/182380 (0.74 %) finished / train loss: 0.2541297131587031
epoch 1: 135840/182380 (0.74 %) finished / train loss: 0.2541463756238333
epoch 1: 136000/182380 (0.75 %) finished / train loss: 0.254109373355613
epoch 1: 136160/182380 (0.75 %) finished / train loss: 0.25410289816584625
epoch 1: 136320/182380 (0.75 %) finished / train loss: 0.2540701839950443
epoch 1: 136480/182380 (0.75 %) finished / train loss: 0.2540976283733339
epoch 1: 136640/182380 (0.75 %) finished / train loss: 0.2540691624655098
epoch 1: 136800/182380 (0.75 %) finished / train loss: 0.25406722900463125
epoch 1: 136960/182380 (0.75 %) finished / train loss: 0.254081549707835
epoch 1: 137120/182380 (0.75 %) finished / train loss: 0.2540676103381042
epoch 1: 137280/182380 (0.75 %) finished / train loss: 0.25405892852719847
epoch 1: 137440/182380 (0.75 %) finished / train loss: 0.25405484606903284
epoch 1: 137600/182380 (0.75 %) finished / train loss: 0.2540410971988079
epoch 1: 137760/182380 (0.76 %) fini

epoch 1: 153440/182380 (0.84 %) finished / train loss: 0.25440568656071133
epoch 1: 153600/182380 (0.84 %) finished / train loss: 0.2543851897617181
epoch 1: 153760/182380 (0.84 %) finished / train loss: 0.25437770230651024
epoch 1: 153920/182380 (0.84 %) finished / train loss: 0.25435273167435196
epoch 1: 154080/182380 (0.84 %) finished / train loss: 0.2543355391466234
epoch 1: 154240/182380 (0.85 %) finished / train loss: 0.25433061516754857
epoch 1: 154400/182380 (0.85 %) finished / train loss: 0.25432005212714637
epoch 1: 154560/182380 (0.85 %) finished / train loss: 0.25431038920862087
epoch 1: 154720/182380 (0.85 %) finished / train loss: 0.2543179159450432
epoch 1: 154880/182380 (0.85 %) finished / train loss: 0.2543797981394224
epoch 1: 155040/182380 (0.85 %) finished / train loss: 0.2543943894506116
epoch 1: 155200/182380 (0.85 %) finished / train loss: 0.25441634391693724
epoch 1: 155360/182380 (0.85 %) finished / train loss: 0.254404251478482
epoch 1: 155520/182380 (0.85 %) 

epoch 1: 171200/182380 (0.94 %) finished / train loss: 0.25402062763956107
epoch 1: 171360/182380 (0.94 %) finished / train loss: 0.2540205774910532
epoch 1: 171520/182380 (0.94 %) finished / train loss: 0.2539930279880985
epoch 1: 171680/182380 (0.94 %) finished / train loss: 0.25400177871692103
epoch 1: 171840/182380 (0.94 %) finished / train loss: 0.2540034380704997
epoch 1: 172000/182380 (0.94 %) finished / train loss: 0.25399634431129275
epoch 1: 172160/182380 (0.94 %) finished / train loss: 0.25401077729175525
epoch 1: 172320/182380 (0.94 %) finished / train loss: 0.2540156537748202
epoch 1: 172480/182380 (0.95 %) finished / train loss: 0.2540071347427722
epoch 1: 172640/182380 (0.95 %) finished / train loss: 0.2539910895554858
epoch 1: 172800/182380 (0.95 %) finished / train loss: 0.2539589496150061
epoch 1: 172960/182380 (0.95 %) finished / train loss: 0.2539487386527269
epoch 1: 173120/182380 (0.95 %) finished / train loss: 0.25397920528368234
epoch 1: 173280/182380 (0.95 %) f

epoch 2: 6400/182380 (0.04 %) finished / train loss: 0.2432501357793808
epoch 2: 6560/182380 (0.04 %) finished / train loss: 0.24344963344132028
epoch 2: 6720/182380 (0.04 %) finished / train loss: 0.24285918204557327
epoch 2: 6880/182380 (0.04 %) finished / train loss: 0.24289986137733904
epoch 2: 7040/182380 (0.04 %) finished / train loss: 0.2433990340341221
epoch 2: 7200/182380 (0.04 %) finished / train loss: 0.24304577615525988
epoch 2: 7360/182380 (0.04 %) finished / train loss: 0.24306073681167933
epoch 2: 7520/182380 (0.04 %) finished / train loss: 0.24316046250627396
epoch 2: 7680/182380 (0.04 %) finished / train loss: 0.2430994498853882
epoch 2: 7840/182380 (0.04 %) finished / train loss: 0.2429165281811539
epoch 2: 8000/182380 (0.04 %) finished / train loss: 0.2423912826180458
epoch 2: 8160/182380 (0.04 %) finished / train loss: 0.24252707023246617
epoch 2: 8320/182380 (0.05 %) finished / train loss: 0.24289455184569725
epoch 2: 8480/182380 (0.05 %) finished / train loss: 0.2

epoch 2: 24320/182380 (0.13 %) finished / train loss: 0.24571323463399158
epoch 2: 24480/182380 (0.13 %) finished / train loss: 0.24563998987082564
epoch 2: 24640/182380 (0.14 %) finished / train loss: 0.2456121175126596
epoch 2: 24800/182380 (0.14 %) finished / train loss: 0.24557287737246483
epoch 2: 24960/182380 (0.14 %) finished / train loss: 0.245629560508025
epoch 2: 25120/182380 (0.14 %) finished / train loss: 0.24556648283247734
epoch 2: 25280/182380 (0.14 %) finished / train loss: 0.24568931833852695
epoch 2: 25440/182380 (0.14 %) finished / train loss: 0.24580555322035302
epoch 2: 25600/182380 (0.14 %) finished / train loss: 0.2457740463130176
epoch 2: 25760/182380 (0.14 %) finished / train loss: 0.2457657729061494
epoch 2: 25920/182380 (0.14 %) finished / train loss: 0.24576735104675645
epoch 2: 26080/182380 (0.14 %) finished / train loss: 0.2458935196048643
epoch 2: 26240/182380 (0.14 %) finished / train loss: 0.24605006550143405
epoch 2: 26400/182380 (0.14 %) finished / tr

epoch 2: 42240/182380 (0.23 %) finished / train loss: 0.24718731347132814
epoch 2: 42400/182380 (0.23 %) finished / train loss: 0.24712415150876316
epoch 2: 42560/182380 (0.23 %) finished / train loss: 0.2471861816998711
epoch 2: 42720/182380 (0.23 %) finished / train loss: 0.2472171235843544
epoch 2: 42880/182380 (0.24 %) finished / train loss: 0.247160938104142
epoch 2: 43040/182380 (0.24 %) finished / train loss: 0.24721789598243388
epoch 2: 43200/182380 (0.24 %) finished / train loss: 0.2472452171533196
epoch 2: 43360/182380 (0.24 %) finished / train loss: 0.24734227634224065
epoch 2: 43520/182380 (0.24 %) finished / train loss: 0.24739823964807917
epoch 2: 43680/182380 (0.24 %) finished / train loss: 0.24743397252245264
epoch 2: 43840/182380 (0.24 %) finished / train loss: 0.24735409118180726
epoch 2: 44000/182380 (0.24 %) finished / train loss: 0.24732574365355753
epoch 2: 44160/182380 (0.24 %) finished / train loss: 0.2473094174179478
epoch 2: 44320/182380 (0.24 %) finished / tr

epoch 2: 60160/182380 (0.33 %) finished / train loss: 0.24817227760845043
epoch 2: 60320/182380 (0.33 %) finished / train loss: 0.24815616161816947
epoch 2: 60480/182380 (0.33 %) finished / train loss: 0.24808694165219705
epoch 2: 60640/182380 (0.33 %) finished / train loss: 0.24809531573412602
epoch 2: 60800/182380 (0.33 %) finished / train loss: 0.24813739735044932
epoch 2: 60960/182380 (0.33 %) finished / train loss: 0.2481498829570655
epoch 2: 61120/182380 (0.34 %) finished / train loss: 0.24816844443064084
epoch 2: 61280/182380 (0.34 %) finished / train loss: 0.24822556080768376
epoch 2: 61440/182380 (0.34 %) finished / train loss: 0.24819148368357372
epoch 2: 61600/182380 (0.34 %) finished / train loss: 0.24818871330131184
epoch 2: 61760/182380 (0.34 %) finished / train loss: 0.24819414311431232
epoch 2: 61920/182380 (0.34 %) finished / train loss: 0.24822119310382726
epoch 2: 62080/182380 (0.34 %) finished / train loss: 0.2481839436922491
epoch 2: 62240/182380 (0.34 %) finished 

epoch 2: 78080/182380 (0.43 %) finished / train loss: 0.2483125818984919
epoch 2: 78240/182380 (0.43 %) finished / train loss: 0.2483288993742812
epoch 2: 78400/182380 (0.43 %) finished / train loss: 0.2483825893304786
epoch 2: 78560/182380 (0.43 %) finished / train loss: 0.24838813116011454
epoch 2: 78720/182380 (0.43 %) finished / train loss: 0.24839269578820322
epoch 2: 78880/182380 (0.43 %) finished / train loss: 0.24841821445775564
epoch 2: 79040/182380 (0.43 %) finished / train loss: 0.2484310499026708
epoch 2: 79200/182380 (0.43 %) finished / train loss: 0.24843161180163875
epoch 2: 79360/182380 (0.44 %) finished / train loss: 0.24841998201464452
epoch 2: 79520/182380 (0.44 %) finished / train loss: 0.24838100614202335
epoch 2: 79680/182380 (0.44 %) finished / train loss: 0.24834418767187968
epoch 2: 79840/182380 (0.44 %) finished / train loss: 0.248428427032335
epoch 2: 80000/182380 (0.44 %) finished / train loss: 0.24838454129099846
epoch 2: 80160/182380 (0.44 %) finished / tr

epoch 2: 96000/182380 (0.53 %) finished / train loss: 0.248773265833656
epoch 2: 96160/182380 (0.53 %) finished / train loss: 0.2487921969069419
epoch 2: 96320/182380 (0.53 %) finished / train loss: 0.24879406410396296
epoch 2: 96480/182380 (0.53 %) finished / train loss: 0.24878778292567377
epoch 2: 96640/182380 (0.53 %) finished / train loss: 0.2487775903762571
epoch 2: 96800/182380 (0.53 %) finished / train loss: 0.24876404294297716
epoch 2: 96960/182380 (0.53 %) finished / train loss: 0.2487181169463463
epoch 2: 97120/182380 (0.53 %) finished / train loss: 0.2487622010452547
epoch 2: 97280/182380 (0.53 %) finished / train loss: 0.24879343847401048
epoch 2: 97440/182380 (0.53 %) finished / train loss: 0.24879042807666735
epoch 2: 97600/182380 (0.54 %) finished / train loss: 0.24875111446517412
epoch 2: 97760/182380 (0.54 %) finished / train loss: 0.2487349787437389
epoch 2: 97920/182380 (0.54 %) finished / train loss: 0.24871792387631203
epoch 2: 98080/182380 (0.54 %) finished / tra

epoch 2: 113760/182380 (0.62 %) finished / train loss: 0.24827211315202646
epoch 2: 113920/182380 (0.62 %) finished / train loss: 0.2482990005587259
epoch 2: 114080/182380 (0.63 %) finished / train loss: 0.24828581794950103
epoch 2: 114240/182380 (0.63 %) finished / train loss: 0.24827590664895643
epoch 2: 114400/182380 (0.63 %) finished / train loss: 0.2482756704258752
epoch 2: 114560/182380 (0.63 %) finished / train loss: 0.2482969264952497
epoch 2: 114720/182380 (0.63 %) finished / train loss: 0.24832064082931773
epoch 2: 114880/182380 (0.63 %) finished / train loss: 0.248295629323359
epoch 2: 115040/182380 (0.63 %) finished / train loss: 0.2482970000805543
epoch 2: 115200/182380 (0.63 %) finished / train loss: 0.2483112951243917
epoch 2: 115360/182380 (0.63 %) finished / train loss: 0.2483051688760395
epoch 2: 115520/182380 (0.63 %) finished / train loss: 0.24828762962712475
epoch 2: 115680/182380 (0.63 %) finished / train loss: 0.2483131122457206
epoch 2: 115840/182380 (0.64 %) fi

epoch 2: 131360/182380 (0.72 %) finished / train loss: 0.24794263554403465
epoch 2: 131520/182380 (0.72 %) finished / train loss: 0.2479367939080055
epoch 2: 131680/182380 (0.72 %) finished / train loss: 0.24795128864984176
epoch 2: 131840/182380 (0.72 %) finished / train loss: 0.24797590659587707
epoch 2: 132000/182380 (0.72 %) finished / train loss: 0.24797047423232685
epoch 2: 132160/182380 (0.72 %) finished / train loss: 0.24797543146203274
epoch 2: 132320/182380 (0.73 %) finished / train loss: 0.24797290700162336
epoch 2: 132480/182380 (0.73 %) finished / train loss: 0.2479581019692663
epoch 2: 132640/182380 (0.73 %) finished / train loss: 0.247947262326397
epoch 2: 132800/182380 (0.73 %) finished / train loss: 0.2479243674299803
epoch 2: 132960/182380 (0.73 %) finished / train loss: 0.24790439075296106
epoch 2: 133120/182380 (0.73 %) finished / train loss: 0.2478874972842347
epoch 2: 133280/182380 (0.73 %) finished / train loss: 0.24789575836023076
epoch 2: 133440/182380 (0.73 %)

epoch 2: 148960/182380 (0.82 %) finished / train loss: 0.24798539551705218
epoch 2: 149120/182380 (0.82 %) finished / train loss: 0.2479923343581703
epoch 2: 149280/182380 (0.82 %) finished / train loss: 0.24799771867572687
epoch 2: 149440/182380 (0.82 %) finished / train loss: 0.24800243744311548
epoch 2: 149600/182380 (0.82 %) finished / train loss: 0.24801022461072647
epoch 2: 149760/182380 (0.82 %) finished / train loss: 0.248012045567107
epoch 2: 149920/182380 (0.82 %) finished / train loss: 0.2480229795424381
epoch 2: 150080/182380 (0.82 %) finished / train loss: 0.24805280460414095
epoch 2: 150240/182380 (0.82 %) finished / train loss: 0.2480721688752992
epoch 2: 150400/182380 (0.82 %) finished / train loss: 0.24806832834444148
epoch 2: 150560/182380 (0.83 %) finished / train loss: 0.24806623148487428
epoch 2: 150720/182380 (0.83 %) finished / train loss: 0.24808735613989982
epoch 2: 150880/182380 (0.83 %) finished / train loss: 0.24808375928017645
epoch 2: 151040/182380 (0.83 %

epoch 2: 166560/182380 (0.91 %) finished / train loss: 0.24829688070200592
epoch 2: 166720/182380 (0.91 %) finished / train loss: 0.24827283160357008
epoch 2: 166880/182380 (0.92 %) finished / train loss: 0.24827367726245525
epoch 2: 167040/182380 (0.92 %) finished / train loss: 0.24828208470253196
epoch 2: 167200/182380 (0.92 %) finished / train loss: 0.24827203393267672
epoch 2: 167360/182380 (0.92 %) finished / train loss: 0.24829460100393677
epoch 2: 167520/182380 (0.92 %) finished / train loss: 0.2482731876565711
epoch 2: 167680/182380 (0.92 %) finished / train loss: 0.24826719382393905
epoch 2: 167840/182380 (0.92 %) finished / train loss: 0.24824912868532484
epoch 2: 168000/182380 (0.92 %) finished / train loss: 0.24822445028736478
epoch 2: 168160/182380 (0.92 %) finished / train loss: 0.2482232730208296
epoch 2: 168320/182380 (0.92 %) finished / train loss: 0.2482167706545088
epoch 2: 168480/182380 (0.92 %) finished / train loss: 0.24825509896984807
epoch 2: 168640/182380 (0.92

epoch 3: 1600/182380 (0.01 %) finished / train loss: 0.2467580744624138
epoch 3: 1760/182380 (0.01 %) finished / train loss: 0.24795630980621686
epoch 3: 1920/182380 (0.01 %) finished / train loss: 0.24823568438490232
epoch 3: 2080/182380 (0.01 %) finished / train loss: 0.2480975852562831
epoch 3: 2240/182380 (0.01 %) finished / train loss: 0.24626949365649906
epoch 3: 2400/182380 (0.01 %) finished / train loss: 0.24482174237569174
epoch 3: 2560/182380 (0.01 %) finished / train loss: 0.24543656911700965
epoch 3: 2720/182380 (0.01 %) finished / train loss: 0.24611298827564015
epoch 3: 2880/182380 (0.02 %) finished / train loss: 0.24700377302037346
epoch 3: 3040/182380 (0.02 %) finished / train loss: 0.24753231970887435
epoch 3: 3200/182380 (0.02 %) finished / train loss: 0.24710306018590927
epoch 3: 3360/182380 (0.02 %) finished / train loss: 0.24755766916842686
epoch 3: 3520/182380 (0.02 %) finished / train loss: 0.2474477071653713
epoch 3: 3680/182380 (0.02 %) finished / train loss: 0

epoch 3: 19520/182380 (0.11 %) finished / train loss: 0.2445380066994761
epoch 3: 19680/182380 (0.11 %) finished / train loss: 0.2445226193685842
epoch 3: 19840/182380 (0.11 %) finished / train loss: 0.24461287529237807
epoch 3: 20000/182380 (0.11 %) finished / train loss: 0.24475688111782073
epoch 3: 20160/182380 (0.11 %) finished / train loss: 0.2447777796832342
epoch 3: 20320/182380 (0.11 %) finished / train loss: 0.24475183134942544
epoch 3: 20480/182380 (0.11 %) finished / train loss: 0.2448902313131839
epoch 3: 20640/182380 (0.11 %) finished / train loss: 0.24493830954843712
epoch 3: 20800/182380 (0.11 %) finished / train loss: 0.24488858763988203
epoch 3: 20960/182380 (0.11 %) finished / train loss: 0.24497985641919928
epoch 3: 21120/182380 (0.12 %) finished / train loss: 0.24488478503895528
epoch 3: 21280/182380 (0.12 %) finished / train loss: 0.2448086520110754
epoch 3: 21440/182380 (0.12 %) finished / train loss: 0.24474169569673823
epoch 3: 21600/182380 (0.12 %) finished / t

epoch 3: 37440/182380 (0.21 %) finished / train loss: 0.2446555728968392
epoch 3: 37600/182380 (0.21 %) finished / train loss: 0.24448959066512738
epoch 3: 37760/182380 (0.21 %) finished / train loss: 0.24449774526943593
epoch 3: 37920/182380 (0.21 %) finished / train loss: 0.24450110604491415
epoch 3: 38080/182380 (0.21 %) finished / train loss: 0.24446728366012332
epoch 3: 38240/182380 (0.21 %) finished / train loss: 0.2443604620056671
epoch 3: 38400/182380 (0.21 %) finished / train loss: 0.2443794505422314
epoch 3: 38560/182380 (0.21 %) finished / train loss: 0.24429773034149185
epoch 3: 38720/182380 (0.21 %) finished / train loss: 0.24416325168668732
epoch 3: 38880/182380 (0.21 %) finished / train loss: 0.2441620840825171
epoch 3: 39040/182380 (0.21 %) finished / train loss: 0.24419900467161273
epoch 3: 39200/182380 (0.21 %) finished / train loss: 0.2441506214044532
epoch 3: 39360/182380 (0.22 %) finished / train loss: 0.24414611598098182
epoch 3: 39520/182380 (0.22 %) finished / t

epoch 3: 55360/182380 (0.30 %) finished / train loss: 0.24384939382014248
epoch 3: 55520/182380 (0.30 %) finished / train loss: 0.24380903256042546
epoch 3: 55680/182380 (0.31 %) finished / train loss: 0.2438876172506261
epoch 3: 55840/182380 (0.31 %) finished / train loss: 0.2438808385400171
epoch 3: 56000/182380 (0.31 %) finished / train loss: 0.24389968007802965
epoch 3: 56160/182380 (0.31 %) finished / train loss: 0.2438888230809459
epoch 3: 56320/182380 (0.31 %) finished / train loss: 0.24390444973991676
epoch 3: 56480/182380 (0.31 %) finished / train loss: 0.24388873513798537
epoch 3: 56640/182380 (0.31 %) finished / train loss: 0.24388575444450486
epoch 3: 56800/182380 (0.31 %) finished / train loss: 0.24396134589759397
epoch 3: 56960/182380 (0.31 %) finished / train loss: 0.24396677474292477
epoch 3: 57120/182380 (0.31 %) finished / train loss: 0.24395044057810006
epoch 3: 57280/182380 (0.31 %) finished / train loss: 0.2438896572040446
epoch 3: 57440/182380 (0.31 %) finished / 

epoch 3: 73280/182380 (0.40 %) finished / train loss: 0.24516460861050926
epoch 3: 73440/182380 (0.40 %) finished / train loss: 0.24519541007111534
epoch 3: 73600/182380 (0.40 %) finished / train loss: 0.24520196452736853
epoch 3: 73760/182380 (0.40 %) finished / train loss: 0.2452132083976605
epoch 3: 73920/182380 (0.41 %) finished / train loss: 0.24525598873307694
epoch 3: 74080/182380 (0.41 %) finished / train loss: 0.245282824759092
epoch 3: 74240/182380 (0.41 %) finished / train loss: 0.24534086923532444
epoch 3: 74400/182380 (0.41 %) finished / train loss: 0.2453649276751344
epoch 3: 74560/182380 (0.41 %) finished / train loss: 0.2453596342402978
epoch 3: 74720/182380 (0.41 %) finished / train loss: 0.24533314505787426
epoch 3: 74880/182380 (0.41 %) finished / train loss: 0.2453073548646564
epoch 3: 75040/182380 (0.41 %) finished / train loss: 0.24525716818853227
epoch 3: 75200/182380 (0.41 %) finished / train loss: 0.24520664416729135
epoch 3: 75360/182380 (0.41 %) finished / tr

epoch 3: 91200/182380 (0.50 %) finished / train loss: 0.24486127124543774
epoch 3: 91360/182380 (0.50 %) finished / train loss: 0.24489222847434142
epoch 3: 91520/182380 (0.50 %) finished / train loss: 0.24489316214527285
epoch 3: 91680/182380 (0.50 %) finished / train loss: 0.244868787478194
epoch 3: 91840/182380 (0.50 %) finished / train loss: 0.2448664490769549
epoch 3: 92000/182380 (0.50 %) finished / train loss: 0.2448846022201621
epoch 3: 92160/182380 (0.51 %) finished / train loss: 0.24482805961225595
epoch 3: 92320/182380 (0.51 %) finished / train loss: 0.24480341605751726
epoch 3: 92480/182380 (0.51 %) finished / train loss: 0.24481757083153644
epoch 3: 92640/182380 (0.51 %) finished / train loss: 0.24483912023032062
epoch 3: 92800/182380 (0.51 %) finished / train loss: 0.2448874679413335
epoch 3: 92960/182380 (0.51 %) finished / train loss: 0.244854856173471
epoch 3: 93120/182380 (0.51 %) finished / train loss: 0.24484245090959816
epoch 3: 93280/182380 (0.51 %) finished / tra

epoch 3: 108960/182380 (0.60 %) finished / train loss: 0.24437543700795167
epoch 3: 109120/182380 (0.60 %) finished / train loss: 0.2444565292546127
epoch 3: 109280/182380 (0.60 %) finished / train loss: 0.24448342833389825
epoch 3: 109440/182380 (0.60 %) finished / train loss: 0.2444536733871315
epoch 3: 109600/182380 (0.60 %) finished / train loss: 0.24445140577580807
epoch 3: 109760/182380 (0.60 %) finished / train loss: 0.2444638413998893
epoch 3: 109920/182380 (0.60 %) finished / train loss: 0.24443543881741847
epoch 3: 110080/182380 (0.60 %) finished / train loss: 0.2444253087693522
epoch 3: 110240/182380 (0.60 %) finished / train loss: 0.24442913584162432
epoch 3: 110400/182380 (0.61 %) finished / train loss: 0.24438561629557956
epoch 3: 110560/182380 (0.61 %) finished / train loss: 0.24433778365683106
epoch 3: 110720/182380 (0.61 %) finished / train loss: 0.2443520773482116
epoch 3: 110880/182380 (0.61 %) finished / train loss: 0.2443265459797255
epoch 3: 111040/182380 (0.61 %)

epoch 3: 126560/182380 (0.69 %) finished / train loss: 0.2439385531335956
epoch 3: 126720/182380 (0.69 %) finished / train loss: 0.24391870730076776
epoch 3: 126880/182380 (0.70 %) finished / train loss: 0.24393820849072287
epoch 3: 127040/182380 (0.70 %) finished / train loss: 0.24389653229893604
epoch 3: 127200/182380 (0.70 %) finished / train loss: 0.24386089559621033
epoch 3: 127360/182380 (0.70 %) finished / train loss: 0.24387345577229808
epoch 3: 127520/182380 (0.70 %) finished / train loss: 0.24389820451494143
epoch 3: 127680/182380 (0.70 %) finished / train loss: 0.24390062178884234
epoch 3: 127840/182380 (0.70 %) finished / train loss: 0.24394931373220213
epoch 3: 128000/182380 (0.70 %) finished / train loss: 0.24392298065871001
epoch 3: 128160/182380 (0.70 %) finished / train loss: 0.24388918524303388
epoch 3: 128320/182380 (0.70 %) finished / train loss: 0.2438966865588602
epoch 3: 128480/182380 (0.70 %) finished / train loss: 0.2439426233173159
epoch 3: 128640/182380 (0.71

epoch 3: 144160/182380 (0.79 %) finished / train loss: 0.24436292177630584
epoch 3: 144320/182380 (0.79 %) finished / train loss: 0.24437652688531283
epoch 3: 144480/182380 (0.79 %) finished / train loss: 0.24439807940493127
epoch 3: 144640/182380 (0.79 %) finished / train loss: 0.24440309445876462
epoch 3: 144800/182380 (0.79 %) finished / train loss: 0.2443786488481648
epoch 3: 144960/182380 (0.79 %) finished / train loss: 0.24439592622631695
epoch 3: 145120/182380 (0.80 %) finished / train loss: 0.24438650379698754
epoch 3: 145280/182380 (0.80 %) finished / train loss: 0.24437520718325076
epoch 3: 145440/182380 (0.80 %) finished / train loss: 0.24437542104288296
epoch 3: 145600/182380 (0.80 %) finished / train loss: 0.24441433761801037
epoch 3: 145760/182380 (0.80 %) finished / train loss: 0.24439847954476313
epoch 3: 145920/182380 (0.80 %) finished / train loss: 0.24440266398811025
epoch 3: 146080/182380 (0.80 %) finished / train loss: 0.24442566284932285
epoch 3: 146240/182380 (0.

epoch 3: 161760/182380 (0.89 %) finished / train loss: 0.24430664421071166
epoch 3: 161920/182380 (0.89 %) finished / train loss: 0.24434723632608948
epoch 3: 162080/182380 (0.89 %) finished / train loss: 0.24433245880406088
epoch 3: 162240/182380 (0.89 %) finished / train loss: 0.2443343944685934
epoch 3: 162400/182380 (0.89 %) finished / train loss: 0.2443207599112553
epoch 3: 162560/182380 (0.89 %) finished / train loss: 0.244342013342878
epoch 3: 162720/182380 (0.89 %) finished / train loss: 0.2443313097443904
epoch 3: 162880/182380 (0.89 %) finished / train loss: 0.24434048205848294
epoch 3: 163040/182380 (0.89 %) finished / train loss: 0.2443233197962571
epoch 3: 163200/182380 (0.89 %) finished / train loss: 0.24431970051106286
epoch 3: 163360/182380 (0.90 %) finished / train loss: 0.24433827471721417
epoch 3: 163520/182380 (0.90 %) finished / train loss: 0.24436466854262492
epoch 3: 163680/182380 (0.90 %) finished / train loss: 0.24434795276801724
epoch 3: 163840/182380 (0.90 %)

epoch 3: 179360/182380 (0.98 %) finished / train loss: 0.24441882211060315
epoch 3: 179520/182380 (0.98 %) finished / train loss: 0.24441678266368022
epoch 3: 179680/182380 (0.99 %) finished / train loss: 0.24445749126368088
epoch 3: 179840/182380 (0.99 %) finished / train loss: 0.24447779802612138
epoch 3: 180000/182380 (0.99 %) finished / train loss: 0.24447128546237945
epoch 3: 180160/182380 (0.99 %) finished / train loss: 0.24447855551596434
epoch 3: 180320/182380 (0.99 %) finished / train loss: 0.2444786515400911
epoch 3: 180480/182380 (0.99 %) finished / train loss: 0.2444694459121278
epoch 3: 180640/182380 (0.99 %) finished / train loss: 0.24447359757892212
epoch 3: 180800/182380 (0.99 %) finished / train loss: 0.24448743125506206
epoch 3: 180960/182380 (0.99 %) finished / train loss: 0.24449312316960303
epoch 3: 181120/182380 (0.99 %) finished / train loss: 0.24450259328730958
epoch 3: 181280/182380 (0.99 %) finished / train loss: 0.24449223227345196
epoch 3: 181440/182380 (0.9

epoch 4: 14720/182380 (0.08 %) finished / train loss: 0.24194947008205497
epoch 4: 14880/182380 (0.08 %) finished / train loss: 0.24198578922979294
epoch 4: 15040/182380 (0.08 %) finished / train loss: 0.24225617485477569
epoch 4: 15200/182380 (0.08 %) finished / train loss: 0.24234413507737612
epoch 4: 15360/182380 (0.08 %) finished / train loss: 0.24227257957682014
epoch 4: 15520/182380 (0.09 %) finished / train loss: 0.2421833165527619
epoch 4: 15680/182380 (0.09 %) finished / train loss: 0.2427284827645944
epoch 4: 15840/182380 (0.09 %) finished / train loss: 0.2429825190943901
epoch 4: 16000/182380 (0.09 %) finished / train loss: 0.24283682331442832
epoch 4: 16160/182380 (0.09 %) finished / train loss: 0.24293732466083942
epoch 4: 16320/182380 (0.09 %) finished / train loss: 0.2428284302938218
epoch 4: 16480/182380 (0.09 %) finished / train loss: 0.2428009398932596
epoch 4: 16640/182380 (0.09 %) finished / train loss: 0.2428584774526266
epoch 4: 16800/182380 (0.09 %) finished / tr

epoch 4: 32640/182380 (0.18 %) finished / train loss: 0.2425383058102692
epoch 4: 32800/182380 (0.18 %) finished / train loss: 0.24263457030784794
epoch 4: 32960/182380 (0.18 %) finished / train loss: 0.24263128843701
epoch 4: 33120/182380 (0.18 %) finished / train loss: 0.24252258245495784
epoch 4: 33280/182380 (0.18 %) finished / train loss: 0.2423371917496507
epoch 4: 33440/182380 (0.18 %) finished / train loss: 0.24225362232712466
epoch 4: 33600/182380 (0.18 %) finished / train loss: 0.24209682494401932
epoch 4: 33760/182380 (0.19 %) finished / train loss: 0.2420233568450286
epoch 4: 33920/182380 (0.19 %) finished / train loss: 0.24200565916187358
epoch 4: 34080/182380 (0.19 %) finished / train loss: 0.24201154755034918
epoch 4: 34240/182380 (0.19 %) finished / train loss: 0.24205615141681422
epoch 4: 34400/182380 (0.19 %) finished / train loss: 0.24209900868493456
epoch 4: 34560/182380 (0.19 %) finished / train loss: 0.24202513189779387
epoch 4: 34720/182380 (0.19 %) finished / tr

epoch 4: 50560/182380 (0.28 %) finished / train loss: 0.24238822261178042
epoch 4: 50720/182380 (0.28 %) finished / train loss: 0.24242210539545547
epoch 4: 50880/182380 (0.28 %) finished / train loss: 0.2423957253308416
epoch 4: 51040/182380 (0.28 %) finished / train loss: 0.24242467145934748
epoch 4: 51200/182380 (0.28 %) finished / train loss: 0.24243540207855405
epoch 4: 51360/182380 (0.28 %) finished / train loss: 0.24243081923214446
epoch 4: 51520/182380 (0.28 %) finished / train loss: 0.242498367950783
epoch 4: 51680/182380 (0.28 %) finished / train loss: 0.24243099654422087
epoch 4: 51840/182380 (0.28 %) finished / train loss: 0.24239546443209237
epoch 4: 52000/182380 (0.29 %) finished / train loss: 0.24244273891815774
epoch 4: 52160/182380 (0.29 %) finished / train loss: 0.2424731974130028
epoch 4: 52320/182380 (0.29 %) finished / train loss: 0.2425366753102807
epoch 4: 52480/182380 (0.29 %) finished / train loss: 0.2425718921622852
epoch 4: 52640/182380 (0.29 %) finished / tr

epoch 4: 68480/182380 (0.38 %) finished / train loss: 0.24180018238932172
epoch 4: 68640/182380 (0.38 %) finished / train loss: 0.24173176528968454
epoch 4: 68800/182380 (0.38 %) finished / train loss: 0.24175959973834282
epoch 4: 68960/182380 (0.38 %) finished / train loss: 0.2416704813662372
epoch 4: 69120/182380 (0.38 %) finished / train loss: 0.24168169835789335
epoch 4: 69280/182380 (0.38 %) finished / train loss: 0.24165548869423722
epoch 4: 69440/182380 (0.38 %) finished / train loss: 0.24168141525461925
epoch 4: 69600/182380 (0.38 %) finished / train loss: 0.24163661671095882
epoch 4: 69760/182380 (0.38 %) finished / train loss: 0.2416401439030236
epoch 4: 69920/182380 (0.38 %) finished / train loss: 0.2416668748214534
epoch 4: 70080/182380 (0.38 %) finished / train loss: 0.24166126455346199
epoch 4: 70240/182380 (0.39 %) finished / train loss: 0.24165114281796649
epoch 4: 70400/182380 (0.39 %) finished / train loss: 0.2416508364406499
epoch 4: 70560/182380 (0.39 %) finished / 

epoch 4: 86400/182380 (0.47 %) finished / train loss: 0.24276587217494294
epoch 4: 86560/182380 (0.47 %) finished / train loss: 0.24273560216819073
epoch 4: 86720/182380 (0.48 %) finished / train loss: 0.24274057283502662
epoch 4: 86880/182380 (0.48 %) finished / train loss: 0.2426913983145691
epoch 4: 87040/182380 (0.48 %) finished / train loss: 0.2426703055279658
epoch 4: 87200/182380 (0.48 %) finished / train loss: 0.24265591791463553
epoch 4: 87360/182380 (0.48 %) finished / train loss: 0.24264811670387185
epoch 4: 87520/182380 (0.48 %) finished / train loss: 0.2426406031116925
epoch 4: 87680/182380 (0.48 %) finished / train loss: 0.24268944391260183
epoch 4: 87840/182380 (0.48 %) finished / train loss: 0.24275471974157461
epoch 4: 88000/182380 (0.48 %) finished / train loss: 0.24279833800684322
epoch 4: 88160/182380 (0.48 %) finished / train loss: 0.2428449464742155
epoch 4: 88320/182380 (0.48 %) finished / train loss: 0.2428246500213509
epoch 4: 88480/182380 (0.49 %) finished / t

epoch 4: 104160/182380 (0.57 %) finished / train loss: 0.24251525556803116
epoch 4: 104320/182380 (0.57 %) finished / train loss: 0.2425039501277947
epoch 4: 104480/182380 (0.57 %) finished / train loss: 0.2424858413419899
epoch 4: 104640/182380 (0.57 %) finished / train loss: 0.24249379346403507
epoch 4: 104800/182380 (0.57 %) finished / train loss: 0.24249293713169243
epoch 4: 104960/182380 (0.58 %) finished / train loss: 0.24247966776715546
epoch 4: 105120/182380 (0.58 %) finished / train loss: 0.24249847656515636
epoch 4: 105280/182380 (0.58 %) finished / train loss: 0.2425176788472477
epoch 4: 105440/182380 (0.58 %) finished / train loss: 0.24251690324684194
epoch 4: 105600/182380 (0.58 %) finished / train loss: 0.24248721706144738
epoch 4: 105760/182380 (0.58 %) finished / train loss: 0.2424521979198153
epoch 4: 105920/182380 (0.58 %) finished / train loss: 0.24243291822174884
epoch 4: 106080/182380 (0.58 %) finished / train loss: 0.24248831635776508
epoch 4: 106240/182380 (0.58 

epoch 4: 121760/182380 (0.67 %) finished / train loss: 0.24218609343612085
epoch 4: 121920/182380 (0.67 %) finished / train loss: 0.242170129043693
epoch 4: 122080/182380 (0.67 %) finished / train loss: 0.24217503979352947
epoch 4: 122240/182380 (0.67 %) finished / train loss: 0.24218462102934327
epoch 4: 122400/182380 (0.67 %) finished / train loss: 0.24216738920975356
epoch 4: 122560/182380 (0.67 %) finished / train loss: 0.2421824235245391
epoch 4: 122720/182380 (0.67 %) finished / train loss: 0.24217755074529013
epoch 4: 122880/182380 (0.67 %) finished / train loss: 0.24218039298430086
epoch 4: 123040/182380 (0.67 %) finished / train loss: 0.2421803905300418
epoch 4: 123200/182380 (0.68 %) finished / train loss: 0.24215702711761772
epoch 4: 123360/182380 (0.68 %) finished / train loss: 0.2422055413750823
epoch 4: 123520/182380 (0.68 %) finished / train loss: 0.24219370094451262
epoch 4: 123680/182380 (0.68 %) finished / train loss: 0.2422058476937542
epoch 4: 123840/182380 (0.68 %)

epoch 4: 139360/182380 (0.76 %) finished / train loss: 0.24196840386439958
epoch 4: 139520/182380 (0.76 %) finished / train loss: 0.24195517205180378
epoch 4: 139680/182380 (0.77 %) finished / train loss: 0.241971058189391
epoch 4: 139840/182380 (0.77 %) finished / train loss: 0.24198380453294693
epoch 4: 140000/182380 (0.77 %) finished / train loss: 0.24196594866684504
epoch 4: 140160/182380 (0.77 %) finished / train loss: 0.24198890766596684
epoch 4: 140320/182380 (0.77 %) finished / train loss: 0.24199086162288214
epoch 4: 140480/182380 (0.77 %) finished / train loss: 0.24194962263175188
epoch 4: 140640/182380 (0.77 %) finished / train loss: 0.24194115407773387
epoch 4: 140800/182380 (0.77 %) finished / train loss: 0.24193086892366408
epoch 4: 140960/182380 (0.77 %) finished / train loss: 0.2419394379340019
epoch 4: 141120/182380 (0.77 %) finished / train loss: 0.24191979194849797
epoch 4: 141280/182380 (0.77 %) finished / train loss: 0.2419231279486303
epoch 4: 141440/182380 (0.78 

epoch 4: 156960/182380 (0.86 %) finished / train loss: 0.24187507227473304
epoch 4: 157120/182380 (0.86 %) finished / train loss: 0.24186023176019886
epoch 4: 157280/182380 (0.86 %) finished / train loss: 0.2418612820570976
epoch 4: 157440/182380 (0.86 %) finished / train loss: 0.2418930980944779
epoch 4: 157600/182380 (0.86 %) finished / train loss: 0.24188638751276859
epoch 4: 157760/182380 (0.87 %) finished / train loss: 0.24186807834896548
epoch 4: 157920/182380 (0.87 %) finished / train loss: 0.24187135948538177
epoch 4: 158080/182380 (0.87 %) finished / train loss: 0.24192376383825354
epoch 4: 158240/182380 (0.87 %) finished / train loss: 0.24191362955452098
epoch 4: 158400/182380 (0.87 %) finished / train loss: 0.2418971860258266
epoch 4: 158560/182380 (0.87 %) finished / train loss: 0.24188635443702836
epoch 4: 158720/182380 (0.87 %) finished / train loss: 0.24190217775082395
epoch 4: 158880/182380 (0.87 %) finished / train loss: 0.24191817570428953
epoch 4: 159040/182380 (0.87

epoch 4: 174560/182380 (0.96 %) finished / train loss: 0.24203546018255184
epoch 4: 174720/182380 (0.96 %) finished / train loss: 0.24203287397985493
epoch 4: 174880/182380 (0.96 %) finished / train loss: 0.24200703668027215
epoch 4: 175040/182380 (0.96 %) finished / train loss: 0.24201305232656067
epoch 4: 175200/182380 (0.96 %) finished / train loss: 0.24199681992128014
epoch 4: 175360/182380 (0.96 %) finished / train loss: 0.24199131097454224
epoch 4: 175520/182380 (0.96 %) finished / train loss: 0.24198652692512695
epoch 4: 175680/182380 (0.96 %) finished / train loss: 0.24199544513268983
epoch 4: 175840/182380 (0.96 %) finished / train loss: 0.24199357981352074
epoch 4: 176000/182380 (0.97 %) finished / train loss: 0.24198582609404218
epoch 4: 176160/182380 (0.97 %) finished / train loss: 0.24198731389725675
epoch 4: 176320/182380 (0.97 %) finished / train loss: 0.2420120194716592
epoch 4: 176480/182380 (0.97 %) finished / train loss: 0.24199392358660157
epoch 4: 176640/182380 (0.

epoch 5: 9760/182380 (0.05 %) finished / train loss: 0.2408854186046319
epoch 5: 9920/182380 (0.05 %) finished / train loss: 0.24119852449624768
epoch 5: 10080/182380 (0.06 %) finished / train loss: 0.24131768861460307
epoch 5: 10240/182380 (0.06 %) finished / train loss: 0.24141305438242852
epoch 5: 10400/182380 (0.06 %) finished / train loss: 0.24164218031443083
epoch 5: 10560/182380 (0.06 %) finished / train loss: 0.24128733056061197
epoch 5: 10720/182380 (0.06 %) finished / train loss: 0.24066924070244405
epoch 5: 10880/182380 (0.06 %) finished / train loss: 0.24069259675110088
epoch 5: 11040/182380 (0.06 %) finished / train loss: 0.24069958463095237
epoch 5: 11200/182380 (0.06 %) finished / train loss: 0.240644619848047
epoch 5: 11360/182380 (0.06 %) finished / train loss: 0.24023578217331792
epoch 5: 11520/182380 (0.06 %) finished / train loss: 0.24020517393946647
epoch 5: 11680/182380 (0.06 %) finished / train loss: 0.24008104343936867
epoch 5: 11840/182380 (0.06 %) finished / t

epoch 5: 27680/182380 (0.15 %) finished / train loss: 0.23892517194927082
epoch 5: 27840/182380 (0.15 %) finished / train loss: 0.23887229621752926
epoch 5: 28000/182380 (0.15 %) finished / train loss: 0.23883039261613573
epoch 5: 28160/182380 (0.15 %) finished / train loss: 0.23880603474310852
epoch 5: 28320/182380 (0.16 %) finished / train loss: 0.23900480994396964
epoch 5: 28480/182380 (0.16 %) finished / train loss: 0.238979938542575
epoch 5: 28640/182380 (0.16 %) finished / train loss: 0.23893654329816721
epoch 5: 28800/182380 (0.16 %) finished / train loss: 0.2390652047759957
epoch 5: 28960/182380 (0.16 %) finished / train loss: 0.23907070533676042
epoch 5: 29120/182380 (0.16 %) finished / train loss: 0.23915597848839812
epoch 5: 29280/182380 (0.16 %) finished / train loss: 0.2391350699415624
epoch 5: 29440/182380 (0.16 %) finished / train loss: 0.23909533864454083
epoch 5: 29600/182380 (0.16 %) finished / train loss: 0.23912464816828033
epoch 5: 29760/182380 (0.16 %) finished / 

epoch 5: 45600/182380 (0.25 %) finished / train loss: 0.24121431501288162
epoch 5: 45760/182380 (0.25 %) finished / train loss: 0.24114453259047927
epoch 5: 45920/182380 (0.25 %) finished / train loss: 0.24112896207940704
epoch 5: 46080/182380 (0.25 %) finished / train loss: 0.2412783341275321
epoch 5: 46240/182380 (0.25 %) finished / train loss: 0.24134864977280573
epoch 5: 46400/182380 (0.25 %) finished / train loss: 0.24139996001432681
epoch 5: 46560/182380 (0.26 %) finished / train loss: 0.2414313584258876
epoch 5: 46720/182380 (0.26 %) finished / train loss: 0.24147791360339074
epoch 5: 46880/182380 (0.26 %) finished / train loss: 0.2414524077453711
epoch 5: 47040/182380 (0.26 %) finished / train loss: 0.24153415156262262
epoch 5: 47200/182380 (0.26 %) finished / train loss: 0.24158187736899167
epoch 5: 47360/182380 (0.26 %) finished / train loss: 0.24169115797692053
epoch 5: 47520/182380 (0.26 %) finished / train loss: 0.24171399113907155
epoch 5: 47680/182380 (0.26 %) finished /

epoch 5: 63520/182380 (0.35 %) finished / train loss: 0.24075433874610688
epoch 5: 63680/182380 (0.35 %) finished / train loss: 0.24074858543860853
epoch 5: 63840/182380 (0.35 %) finished / train loss: 0.24079064453454843
epoch 5: 64000/182380 (0.35 %) finished / train loss: 0.24079419323801995
epoch 5: 64160/182380 (0.35 %) finished / train loss: 0.24082957833187835
epoch 5: 64320/182380 (0.35 %) finished / train loss: 0.2408796038052336
epoch 5: 64480/182380 (0.35 %) finished / train loss: 0.24092009682809154
epoch 5: 64640/182380 (0.35 %) finished / train loss: 0.24091396796526296
epoch 5: 64800/182380 (0.36 %) finished / train loss: 0.2408678670944991
epoch 5: 64960/182380 (0.36 %) finished / train loss: 0.24087201285685225
epoch 5: 65120/182380 (0.36 %) finished / train loss: 0.2408948697827079
epoch 5: 65280/182380 (0.36 %) finished / train loss: 0.24080106984166538
epoch 5: 65440/182380 (0.36 %) finished / train loss: 0.2407556331245124
epoch 5: 65600/182380 (0.36 %) finished / 

epoch 5: 81440/182380 (0.45 %) finished / train loss: 0.24010504564391139
epoch 5: 81600/182380 (0.45 %) finished / train loss: 0.24010708585089327
epoch 5: 81760/182380 (0.45 %) finished / train loss: 0.24008338001142976
epoch 5: 81920/182380 (0.45 %) finished / train loss: 0.2400763841054868
epoch 5: 82080/182380 (0.45 %) finished / train loss: 0.24006402793451126
epoch 5: 82240/182380 (0.45 %) finished / train loss: 0.24016264085639777
epoch 5: 82400/182380 (0.45 %) finished / train loss: 0.24018587479892287
epoch 5: 82560/182380 (0.45 %) finished / train loss: 0.24016161081633827
epoch 5: 82720/182380 (0.45 %) finished / train loss: 0.2401395794386098
epoch 5: 82880/182380 (0.45 %) finished / train loss: 0.240164584013486
epoch 5: 83040/182380 (0.46 %) finished / train loss: 0.2401281803329556
epoch 5: 83200/182380 (0.46 %) finished / train loss: 0.2401311188706985
epoch 5: 83360/182380 (0.46 %) finished / train loss: 0.24014040057810163
epoch 5: 83520/182380 (0.46 %) finished / tr

epoch 5: 99360/182380 (0.54 %) finished / train loss: 0.23943870381936552
epoch 5: 99520/182380 (0.55 %) finished / train loss: 0.23941810641833056
epoch 5: 99680/182380 (0.55 %) finished / train loss: 0.2394303026398342
epoch 5: 99840/182380 (0.55 %) finished / train loss: 0.23939965337705918
epoch 5: 100000/182380 (0.55 %) finished / train loss: 0.23942107586860656
epoch 5: 100160/182380 (0.55 %) finished / train loss: 0.2393689791805828
epoch 5: 100320/182380 (0.55 %) finished / train loss: 0.23934726604814544
epoch 5: 100480/182380 (0.55 %) finished / train loss: 0.23934886627800905
epoch 5: 100640/182380 (0.55 %) finished / train loss: 0.23936538118721
epoch 5: 100800/182380 (0.55 %) finished / train loss: 0.23936892686855224
epoch 5: 100960/182380 (0.55 %) finished / train loss: 0.23941400853087522
epoch 5: 101120/182380 (0.55 %) finished / train loss: 0.2393800793474988
epoch 5: 101280/182380 (0.56 %) finished / train loss: 0.23932797243998138
epoch 5: 101440/182380 (0.56 %) fin

epoch 5: 116960/182380 (0.64 %) finished / train loss: 0.23984842554815164
epoch 5: 117120/182380 (0.64 %) finished / train loss: 0.23985839516250163
epoch 5: 117280/182380 (0.64 %) finished / train loss: 0.23984972998032303
epoch 5: 117440/182380 (0.64 %) finished / train loss: 0.2398568986709501
epoch 5: 117600/182380 (0.64 %) finished / train loss: 0.23989387421380906
epoch 5: 117760/182380 (0.65 %) finished / train loss: 0.23990936433977406
epoch 5: 117920/182380 (0.65 %) finished / train loss: 0.23986965384703315
epoch 5: 118080/182380 (0.65 %) finished / train loss: 0.2398846607342322
epoch 5: 118240/182380 (0.65 %) finished / train loss: 0.2398861894426875
epoch 5: 118400/182380 (0.65 %) finished / train loss: 0.23986654047224973
epoch 5: 118560/182380 (0.65 %) finished / train loss: 0.2398610851703546
epoch 5: 118720/182380 (0.65 %) finished / train loss: 0.23988917010492392
epoch 5: 118880/182380 (0.65 %) finished / train loss: 0.23989510196054287
epoch 5: 119040/182380 (0.65 

epoch 5: 134560/182380 (0.74 %) finished / train loss: 0.23983134636201417
epoch 5: 134720/182380 (0.74 %) finished / train loss: 0.23981103649685898
epoch 5: 134880/182380 (0.74 %) finished / train loss: 0.2398004676417524
epoch 5: 135040/182380 (0.74 %) finished / train loss: 0.23983891041004826
epoch 5: 135200/182380 (0.74 %) finished / train loss: 0.23981624035792942
epoch 5: 135360/182380 (0.74 %) finished / train loss: 0.23982143489463392
epoch 5: 135520/182380 (0.74 %) finished / train loss: 0.23980828254464948
epoch 5: 135680/182380 (0.74 %) finished / train loss: 0.23982775027178369
epoch 5: 135840/182380 (0.74 %) finished / train loss: 0.23981624770080243
epoch 5: 136000/182380 (0.75 %) finished / train loss: 0.23981761733574025
epoch 5: 136160/182380 (0.75 %) finished / train loss: 0.23980391680073654
epoch 5: 136320/182380 (0.75 %) finished / train loss: 0.23980421115045256
epoch 5: 136480/182380 (0.75 %) finished / train loss: 0.23983394501846533
epoch 5: 136640/182380 (0.

epoch 5: 152160/182380 (0.83 %) finished / train loss: 0.23997473563180236
epoch 5: 152320/182380 (0.84 %) finished / train loss: 0.23999967179691592
epoch 5: 152480/182380 (0.84 %) finished / train loss: 0.2399954204075234
epoch 5: 152640/182380 (0.84 %) finished / train loss: 0.23998945340420466
epoch 5: 152800/182380 (0.84 %) finished / train loss: 0.24003273982028062
epoch 5: 152960/182380 (0.84 %) finished / train loss: 0.2400702672055825
epoch 5: 153120/182380 (0.84 %) finished / train loss: 0.24006155150375147
epoch 5: 153280/182380 (0.84 %) finished / train loss: 0.2400654902444503
epoch 5: 153440/182380 (0.84 %) finished / train loss: 0.2400678792387651
epoch 5: 153600/182380 (0.84 %) finished / train loss: 0.24005993665196002
epoch 5: 153760/182380 (0.84 %) finished / train loss: 0.24006585757578572
epoch 5: 153920/182380 (0.84 %) finished / train loss: 0.24008217009709928
epoch 5: 154080/182380 (0.84 %) finished / train loss: 0.24009086582829028
epoch 5: 154240/182380 (0.85 

epoch 5: 169760/182380 (0.93 %) finished / train loss: 0.24003082921379137
epoch 5: 169920/182380 (0.93 %) finished / train loss: 0.2400381258146911
epoch 5: 170080/182380 (0.93 %) finished / train loss: 0.24005939197338425
epoch 5: 170240/182380 (0.93 %) finished / train loss: 0.24004466049933343
epoch 5: 170400/182380 (0.93 %) finished / train loss: 0.24000435775714302
epoch 5: 170560/182380 (0.94 %) finished / train loss: 0.23997038817819466
epoch 5: 170720/182380 (0.94 %) finished / train loss: 0.23996509051032455
epoch 5: 170880/182380 (0.94 %) finished / train loss: 0.23994479505589392
epoch 5: 171040/182380 (0.94 %) finished / train loss: 0.23994271056020897
epoch 5: 171200/182380 (0.94 %) finished / train loss: 0.23993080876140951
epoch 5: 171360/182380 (0.94 %) finished / train loss: 0.23993979042150726
epoch 5: 171520/182380 (0.94 %) finished / train loss: 0.23995907962211033
epoch 5: 171680/182380 (0.94 %) finished / train loss: 0.23994092162202033
epoch 5: 171840/182380 (0.

epoch 6: 4960/182380 (0.03 %) finished / train loss: 0.23840202218101872
epoch 6: 5120/182380 (0.03 %) finished / train loss: 0.23830841183662416
epoch 6: 5280/182380 (0.03 %) finished / train loss: 0.238512814857743
epoch 6: 5440/182380 (0.03 %) finished / train loss: 0.2391387750120724
epoch 6: 5600/182380 (0.03 %) finished / train loss: 0.23883964589663914
epoch 6: 5760/182380 (0.03 %) finished / train loss: 0.23877476304769515
epoch 6: 5920/182380 (0.03 %) finished / train loss: 0.23875873064672626
epoch 6: 6080/182380 (0.03 %) finished / train loss: 0.23867916849098708
epoch 6: 6240/182380 (0.03 %) finished / train loss: 0.23774502659455324
epoch 6: 6400/182380 (0.04 %) finished / train loss: 0.23752745121717453
epoch 6: 6560/182380 (0.04 %) finished / train loss: 0.2365831815614933
epoch 6: 6720/182380 (0.04 %) finished / train loss: 0.23715630365269524
epoch 6: 6880/182380 (0.04 %) finished / train loss: 0.23694953190725904
epoch 6: 7040/182380 (0.04 %) finished / train loss: 0.

epoch 6: 22880/182380 (0.13 %) finished / train loss: 0.237233448362017
epoch 6: 23040/182380 (0.13 %) finished / train loss: 0.2371637374576595
epoch 6: 23200/182380 (0.13 %) finished / train loss: 0.23712187195646353
epoch 6: 23360/182380 (0.13 %) finished / train loss: 0.23705449957553654
epoch 6: 23520/182380 (0.13 %) finished / train loss: 0.23686130458400362
epoch 6: 23680/182380 (0.13 %) finished / train loss: 0.23678988415647198
epoch 6: 23840/182380 (0.13 %) finished / train loss: 0.23682719847099892
epoch 6: 24000/182380 (0.13 %) finished / train loss: 0.23684090775251387
epoch 6: 24160/182380 (0.13 %) finished / train loss: 0.23673089379506396
epoch 6: 24320/182380 (0.13 %) finished / train loss: 0.23680496372674642
epoch 6: 24480/182380 (0.13 %) finished / train loss: 0.23673410910406922
epoch 6: 24640/182380 (0.14 %) finished / train loss: 0.23665539748095846
epoch 6: 24800/182380 (0.14 %) finished / train loss: 0.23653513356562583
epoch 6: 24960/182380 (0.14 %) finished /

epoch 6: 40800/182380 (0.22 %) finished / train loss: 0.23700724656675376
epoch 6: 40960/182380 (0.22 %) finished / train loss: 0.23702315770788118
epoch 6: 41120/182380 (0.23 %) finished / train loss: 0.23704896101923767
epoch 6: 41280/182380 (0.23 %) finished / train loss: 0.2370503446852514
epoch 6: 41440/182380 (0.23 %) finished / train loss: 0.23698293644949275
epoch 6: 41600/182380 (0.23 %) finished / train loss: 0.23707028454312912
epoch 6: 41760/182380 (0.23 %) finished / train loss: 0.2371081095088944
epoch 6: 41920/182380 (0.23 %) finished / train loss: 0.2371417558488955
epoch 6: 42080/182380 (0.23 %) finished / train loss: 0.2370746139337808
epoch 6: 42240/182380 (0.23 %) finished / train loss: 0.2370466978825403
epoch 6: 42400/182380 (0.23 %) finished / train loss: 0.23702738526857126
epoch 6: 42560/182380 (0.23 %) finished / train loss: 0.23720261815347168
epoch 6: 42720/182380 (0.23 %) finished / train loss: 0.23714706426702636
epoch 6: 42880/182380 (0.24 %) finished / t

epoch 6: 58720/182380 (0.32 %) finished / train loss: 0.23890124787589184
epoch 6: 58880/182380 (0.32 %) finished / train loss: 0.23892994723080294
epoch 6: 59040/182380 (0.32 %) finished / train loss: 0.23899976566716585
epoch 6: 59200/182380 (0.32 %) finished / train loss: 0.23900252795702703
epoch 6: 59360/182380 (0.33 %) finished / train loss: 0.23906225361271366
epoch 6: 59520/182380 (0.33 %) finished / train loss: 0.2389862774841247
epoch 6: 59680/182380 (0.33 %) finished / train loss: 0.23900099976772277
epoch 6: 59840/182380 (0.33 %) finished / train loss: 0.23893733892370672
epoch 6: 60000/182380 (0.33 %) finished / train loss: 0.2388655262708664
epoch 6: 60160/182380 (0.33 %) finished / train loss: 0.2388393527887603
epoch 6: 60320/182380 (0.33 %) finished / train loss: 0.23883247013433542
epoch 6: 60480/182380 (0.33 %) finished / train loss: 0.2388155691601612
epoch 6: 60640/182380 (0.33 %) finished / train loss: 0.23881432661752272
epoch 6: 60800/182380 (0.33 %) finished / 

epoch 6: 76640/182380 (0.42 %) finished / train loss: 0.238488083206786
epoch 6: 76800/182380 (0.42 %) finished / train loss: 0.23850085600589713
epoch 6: 76960/182380 (0.42 %) finished / train loss: 0.23843235584777506
epoch 6: 77120/182380 (0.42 %) finished / train loss: 0.23838435909807434
epoch 6: 77280/182380 (0.42 %) finished / train loss: 0.23840646637646062
epoch 6: 77440/182380 (0.42 %) finished / train loss: 0.23841177174005626
epoch 6: 77600/182380 (0.43 %) finished / train loss: 0.238465294377091
epoch 6: 77760/182380 (0.43 %) finished / train loss: 0.23845857062948095
epoch 6: 77920/182380 (0.43 %) finished / train loss: 0.23840037725666954
epoch 6: 78080/182380 (0.43 %) finished / train loss: 0.23844271942850997
epoch 6: 78240/182380 (0.43 %) finished / train loss: 0.23843661172502123
epoch 6: 78400/182380 (0.43 %) finished / train loss: 0.23844831643664108
epoch 6: 78560/182380 (0.43 %) finished / train loss: 0.23846333883323398
epoch 6: 78720/182380 (0.43 %) finished / 

epoch 6: 94560/182380 (0.52 %) finished / train loss: 0.23790331969507253
epoch 6: 94720/182380 (0.52 %) finished / train loss: 0.23789684597805544
epoch 6: 94880/182380 (0.52 %) finished / train loss: 0.23785833754085167
epoch 6: 95040/182380 (0.52 %) finished / train loss: 0.2378758391095733
epoch 6: 95200/182380 (0.52 %) finished / train loss: 0.23781931056695826
epoch 6: 95360/182380 (0.52 %) finished / train loss: 0.2377884266960541
epoch 6: 95520/182380 (0.52 %) finished / train loss: 0.23777855443495202
epoch 6: 95680/182380 (0.52 %) finished / train loss: 0.23780186557550495
epoch 6: 95840/182380 (0.53 %) finished / train loss: 0.23776445019623274
epoch 6: 96000/182380 (0.53 %) finished / train loss: 0.23776205194493136
epoch 6: 96160/182380 (0.53 %) finished / train loss: 0.23778560807720794
epoch 6: 96320/182380 (0.53 %) finished / train loss: 0.2377746883123816
epoch 6: 96480/182380 (0.53 %) finished / train loss: 0.23775515798015975
epoch 6: 96640/182380 (0.53 %) finished /

epoch 6: 112320/182380 (0.62 %) finished / train loss: 0.23729791833974018
epoch 6: 112480/182380 (0.62 %) finished / train loss: 0.2373154347049732
epoch 6: 112640/182380 (0.62 %) finished / train loss: 0.23735304885882547
epoch 6: 112800/182380 (0.62 %) finished / train loss: 0.237355896154194
epoch 6: 112960/182380 (0.62 %) finished / train loss: 0.23729644266640498
epoch 6: 113120/182380 (0.62 %) finished / train loss: 0.23730903995003355
epoch 6: 113280/182380 (0.62 %) finished / train loss: 0.2373245892720034
epoch 6: 113440/182380 (0.62 %) finished / train loss: 0.2373677182180757
epoch 6: 113600/182380 (0.62 %) finished / train loss: 0.2373652501467248
epoch 6: 113760/182380 (0.62 %) finished / train loss: 0.23740872633859578
epoch 6: 113920/182380 (0.62 %) finished / train loss: 0.2374108045707258
epoch 6: 114080/182380 (0.63 %) finished / train loss: 0.23742322412647338
epoch 6: 114240/182380 (0.63 %) finished / train loss: 0.2374304075701898
epoch 6: 114400/182380 (0.63 %) f

epoch 6: 129920/182380 (0.71 %) finished / train loss: 0.23781452505239126
epoch 6: 130080/182380 (0.71 %) finished / train loss: 0.2377967669001951
epoch 6: 130240/182380 (0.71 %) finished / train loss: 0.23778249585511352
epoch 6: 130400/182380 (0.71 %) finished / train loss: 0.2378173725992624
epoch 6: 130560/182380 (0.72 %) finished / train loss: 0.23782535304552785
epoch 6: 130720/182380 (0.72 %) finished / train loss: 0.23780572117104523
epoch 6: 130880/182380 (0.72 %) finished / train loss: 0.2378214331375649
epoch 6: 131040/182380 (0.72 %) finished / train loss: 0.23783900292365107
epoch 6: 131200/182380 (0.72 %) finished / train loss: 0.23784078280736762
epoch 6: 131360/182380 (0.72 %) finished / train loss: 0.23785873292497248
epoch 6: 131520/182380 (0.72 %) finished / train loss: 0.23782809831365181
epoch 6: 131680/182380 (0.72 %) finished / train loss: 0.237835355474187
epoch 6: 131840/182380 (0.72 %) finished / train loss: 0.23786307622145103
epoch 6: 132000/182380 (0.72 %

epoch 6: 147520/182380 (0.81 %) finished / train loss: 0.23775491987934858
epoch 6: 147680/182380 (0.81 %) finished / train loss: 0.23774016406205467
epoch 6: 147840/182380 (0.81 %) finished / train loss: 0.23775176892613437
epoch 6: 148000/182380 (0.81 %) finished / train loss: 0.2377402196381543
epoch 6: 148160/182380 (0.81 %) finished / train loss: 0.23775967226301362
epoch 6: 148320/182380 (0.81 %) finished / train loss: 0.2377747992867405
epoch 6: 148480/182380 (0.81 %) finished / train loss: 0.23776338180398632
epoch 6: 148640/182380 (0.82 %) finished / train loss: 0.23777539804176828
epoch 6: 148800/182380 (0.82 %) finished / train loss: 0.23774940571477338
epoch 6: 148960/182380 (0.82 %) finished / train loss: 0.2377471119677598
epoch 6: 149120/182380 (0.82 %) finished / train loss: 0.23773372010547716
epoch 6: 149280/182380 (0.82 %) finished / train loss: 0.2377537834363224
epoch 6: 149440/182380 (0.82 %) finished / train loss: 0.23773709187160466
epoch 6: 149600/182380 (0.82 

epoch 6: 165120/182380 (0.91 %) finished / train loss: 0.23796221654024696
epoch 6: 165280/182380 (0.91 %) finished / train loss: 0.23795748958859994
epoch 6: 165440/182380 (0.91 %) finished / train loss: 0.23796180589286686
epoch 6: 165600/182380 (0.91 %) finished / train loss: 0.23798260989972359
epoch 6: 165760/182380 (0.91 %) finished / train loss: 0.23798181829420295
epoch 6: 165920/182380 (0.91 %) finished / train loss: 0.23798909878776756
epoch 6: 166080/182380 (0.91 %) finished / train loss: 0.23797878665214328
epoch 6: 166240/182380 (0.91 %) finished / train loss: 0.23797036786568176
epoch 6: 166400/182380 (0.91 %) finished / train loss: 0.23799991860699196
epoch 6: 166560/182380 (0.91 %) finished / train loss: 0.2379992573623126
epoch 6: 166720/182380 (0.91 %) finished / train loss: 0.23798949564315536
epoch 6: 166880/182380 (0.92 %) finished / train loss: 0.23799268840771964
epoch 6: 167040/182380 (0.92 %) finished / train loss: 0.23799975427631218
epoch 6: 167200/182380 (0.

epoch 7: 160/182380 (0.00 %) finished / train loss: 0.2530993163585663
epoch 7: 320/182380 (0.00 %) finished / train loss: 0.24704332947731017
epoch 7: 480/182380 (0.00 %) finished / train loss: 0.24561170041561126
epoch 7: 640/182380 (0.00 %) finished / train loss: 0.24595527723431587
epoch 7: 800/182380 (0.00 %) finished / train loss: 0.24627873063087463
epoch 7: 960/182380 (0.01 %) finished / train loss: 0.24256292035182317
epoch 7: 1120/182380 (0.01 %) finished / train loss: 0.23848237139838083
epoch 7: 1280/182380 (0.01 %) finished / train loss: 0.23848310336470604
epoch 7: 1440/182380 (0.01 %) finished / train loss: 0.2447580721643236
epoch 7: 1600/182380 (0.01 %) finished / train loss: 0.2447918677330017
epoch 7: 1760/182380 (0.01 %) finished / train loss: 0.24307504567233
epoch 7: 1920/182380 (0.01 %) finished / train loss: 0.24056251843770346
epoch 7: 2080/182380 (0.01 %) finished / train loss: 0.24190132044828855
epoch 7: 2240/182380 (0.01 %) finished / train loss: 0.24058470

epoch 7: 18240/182380 (0.10 %) finished / train loss: 0.2330687388777733
epoch 7: 18400/182380 (0.10 %) finished / train loss: 0.23299646787021472
epoch 7: 18560/182380 (0.10 %) finished / train loss: 0.23305778385236345
epoch 7: 18720/182380 (0.10 %) finished / train loss: 0.23297445234070477
epoch 7: 18880/182380 (0.10 %) finished / train loss: 0.23306705272298747
epoch 7: 19040/182380 (0.10 %) finished / train loss: 0.23298211523464749
epoch 7: 19200/182380 (0.11 %) finished / train loss: 0.2331081019838651
epoch 7: 19360/182380 (0.11 %) finished / train loss: 0.23291527860420794
epoch 7: 19520/182380 (0.11 %) finished / train loss: 0.23274592254005494
epoch 7: 19680/182380 (0.11 %) finished / train loss: 0.2326810425374566
epoch 7: 19840/182380 (0.11 %) finished / train loss: 0.2326943522739795
epoch 7: 20000/182380 (0.11 %) finished / train loss: 0.23285894768238066
epoch 7: 20160/182380 (0.11 %) finished / train loss: 0.23301676036346528
epoch 7: 20320/182380 (0.11 %) finished / 

epoch 7: 36160/182380 (0.20 %) finished / train loss: 0.23548061043287802
epoch 7: 36320/182380 (0.20 %) finished / train loss: 0.23544496120597821
epoch 7: 36480/182380 (0.20 %) finished / train loss: 0.23544923022650835
epoch 7: 36640/182380 (0.20 %) finished / train loss: 0.23546684524898445
epoch 7: 36800/182380 (0.20 %) finished / train loss: 0.2355517755902332
epoch 7: 36960/182380 (0.20 %) finished / train loss: 0.23558988025436153
epoch 7: 37120/182380 (0.20 %) finished / train loss: 0.2355256294638946
epoch 7: 37280/182380 (0.20 %) finished / train loss: 0.2355011636735032
epoch 7: 37440/182380 (0.21 %) finished / train loss: 0.23559065813946928
epoch 7: 37600/182380 (0.21 %) finished / train loss: 0.23553927799488636
epoch 7: 37760/182380 (0.21 %) finished / train loss: 0.2354782731730049
epoch 7: 37920/182380 (0.21 %) finished / train loss: 0.23560700368780627
epoch 7: 38080/182380 (0.21 %) finished / train loss: 0.23559047525920787
epoch 7: 38240/182380 (0.21 %) finished / 

epoch 7: 54080/182380 (0.30 %) finished / train loss: 0.23530436390074047
epoch 7: 54240/182380 (0.30 %) finished / train loss: 0.23540154197047242
epoch 7: 54400/182380 (0.30 %) finished / train loss: 0.2353634718498763
epoch 7: 54560/182380 (0.30 %) finished / train loss: 0.23536243054174608
epoch 7: 54720/182380 (0.30 %) finished / train loss: 0.23535513309707418
epoch 7: 54880/182380 (0.30 %) finished / train loss: 0.23540835487425502
epoch 7: 55040/182380 (0.30 %) finished / train loss: 0.235385083433154
epoch 7: 55200/182380 (0.30 %) finished / train loss: 0.2353507050310356
epoch 7: 55360/182380 (0.30 %) finished / train loss: 0.23538206967315234
epoch 7: 55520/182380 (0.30 %) finished / train loss: 0.235361303367601
epoch 7: 55680/182380 (0.31 %) finished / train loss: 0.23539914401440784
epoch 7: 55840/182380 (0.31 %) finished / train loss: 0.23544908009661644
epoch 7: 56000/182380 (0.31 %) finished / train loss: 0.23541188281774522
epoch 7: 56160/182380 (0.31 %) finished / tr

epoch 7: 72000/182380 (0.39 %) finished / train loss: 0.23591064277622434
epoch 7: 72160/182380 (0.40 %) finished / train loss: 0.2359981703652511
epoch 7: 72320/182380 (0.40 %) finished / train loss: 0.23601562710462418
epoch 7: 72480/182380 (0.40 %) finished / train loss: 0.23599761140925468
epoch 7: 72640/182380 (0.40 %) finished / train loss: 0.2360042937986126
epoch 7: 72800/182380 (0.40 %) finished / train loss: 0.23598278530351408
epoch 7: 72960/182380 (0.40 %) finished / train loss: 0.23600035008500542
epoch 7: 73120/182380 (0.40 %) finished / train loss: 0.23604843136518217
epoch 7: 73280/182380 (0.40 %) finished / train loss: 0.23605164125496644
epoch 7: 73440/182380 (0.40 %) finished / train loss: 0.23607053248970597
epoch 7: 73600/182380 (0.40 %) finished / train loss: 0.23606612984253011
epoch 7: 73760/182380 (0.40 %) finished / train loss: 0.2360370999109202
epoch 7: 73920/182380 (0.41 %) finished / train loss: 0.2360658344961864
epoch 7: 74080/182380 (0.41 %) finished / 

epoch 7: 89920/182380 (0.49 %) finished / train loss: 0.23573517348630574
epoch 7: 90080/182380 (0.49 %) finished / train loss: 0.23567492193269476
epoch 7: 90240/182380 (0.49 %) finished / train loss: 0.2356716258464553
epoch 7: 90400/182380 (0.50 %) finished / train loss: 0.23565570255823895
epoch 7: 90560/182380 (0.50 %) finished / train loss: 0.23566683899387453
epoch 7: 90720/182380 (0.50 %) finished / train loss: 0.2356952425296134
epoch 7: 90880/182380 (0.50 %) finished / train loss: 0.23569210989689324
epoch 7: 91040/182380 (0.50 %) finished / train loss: 0.2356791683523433
epoch 7: 91200/182380 (0.50 %) finished / train loss: 0.23567769846372438
epoch 7: 91360/182380 (0.50 %) finished / train loss: 0.2357585925250045
epoch 7: 91520/182380 (0.50 %) finished / train loss: 0.23580725385279921
epoch 7: 91680/182380 (0.50 %) finished / train loss: 0.23581394178184956
epoch 7: 91840/182380 (0.50 %) finished / train loss: 0.23577007339287304
epoch 7: 92000/182380 (0.50 %) finished / 

epoch 7: 107680/182380 (0.59 %) finished / train loss: 0.23605044805188768
epoch 7: 107840/182380 (0.59 %) finished / train loss: 0.23607351206884186
epoch 7: 108000/182380 (0.59 %) finished / train loss: 0.2360470797441624
epoch 7: 108160/182380 (0.59 %) finished / train loss: 0.23602882119766355
epoch 7: 108320/182380 (0.59 %) finished / train loss: 0.23603675465816232
epoch 7: 108480/182380 (0.59 %) finished / train loss: 0.23605995812950584
epoch 7: 108640/182380 (0.60 %) finished / train loss: 0.23610435551325948
epoch 7: 108800/182380 (0.60 %) finished / train loss: 0.23611922148834258
epoch 7: 108960/182380 (0.60 %) finished / train loss: 0.23612766077690012
epoch 7: 109120/182380 (0.60 %) finished / train loss: 0.23614903985143057
epoch 7: 109280/182380 (0.60 %) finished / train loss: 0.23614419846199616
epoch 7: 109440/182380 (0.60 %) finished / train loss: 0.23612405337523995
epoch 7: 109600/182380 (0.60 %) finished / train loss: 0.23610543279752244
epoch 7: 109760/182380 (0.

epoch 7: 125280/182380 (0.69 %) finished / train loss: 0.23575369041998268
epoch 7: 125440/182380 (0.69 %) finished / train loss: 0.23573541118934446
epoch 7: 125600/182380 (0.69 %) finished / train loss: 0.23573148290063164
epoch 7: 125760/182380 (0.69 %) finished / train loss: 0.23572375442235524
epoch 7: 125920/182380 (0.69 %) finished / train loss: 0.235732386425005
epoch 7: 126080/182380 (0.69 %) finished / train loss: 0.23570866948986416
epoch 7: 126240/182380 (0.69 %) finished / train loss: 0.23572850157477254
epoch 7: 126400/182380 (0.69 %) finished / train loss: 0.23572304881448988
epoch 7: 126560/182380 (0.69 %) finished / train loss: 0.23569243513754135
epoch 7: 126720/182380 (0.69 %) finished / train loss: 0.23571595297844122
epoch 7: 126880/182380 (0.70 %) finished / train loss: 0.23571974768915213
epoch 7: 127040/182380 (0.70 %) finished / train loss: 0.23571472312476233
epoch 7: 127200/182380 (0.70 %) finished / train loss: 0.23573446683538785
epoch 7: 127360/182380 (0.7

epoch 7: 142880/182380 (0.78 %) finished / train loss: 0.23646087700215326
epoch 7: 143040/182380 (0.78 %) finished / train loss: 0.2364364422641078
epoch 7: 143200/182380 (0.79 %) finished / train loss: 0.23643867771052782
epoch 7: 143360/182380 (0.79 %) finished / train loss: 0.23641823311668952
epoch 7: 143520/182380 (0.79 %) finished / train loss: 0.23640173348362498
epoch 7: 143680/182380 (0.79 %) finished / train loss: 0.23640776719972656
epoch 7: 143840/182380 (0.79 %) finished / train loss: 0.23641291772894918
epoch 7: 144000/182380 (0.79 %) finished / train loss: 0.23641062240799268
epoch 7: 144160/182380 (0.79 %) finished / train loss: 0.2364575256319607
epoch 7: 144320/182380 (0.79 %) finished / train loss: 0.23647882809858364
epoch 7: 144480/182380 (0.79 %) finished / train loss: 0.23650920039923617
epoch 7: 144640/182380 (0.79 %) finished / train loss: 0.2365301079619511
epoch 7: 144800/182380 (0.79 %) finished / train loss: 0.23651086398251148
epoch 7: 144960/182380 (0.79

epoch 7: 160480/182380 (0.88 %) finished / train loss: 0.23638170612892387
epoch 7: 160640/182380 (0.88 %) finished / train loss: 0.23636663815830333
epoch 7: 160800/182380 (0.88 %) finished / train loss: 0.23635118191515037
epoch 7: 160960/182380 (0.88 %) finished / train loss: 0.2363455077436999
epoch 7: 161120/182380 (0.88 %) finished / train loss: 0.2363797411307796
epoch 7: 161280/182380 (0.88 %) finished / train loss: 0.2363698876300265
epoch 7: 161440/182380 (0.89 %) finished / train loss: 0.2363755447688495
epoch 7: 161600/182380 (0.89 %) finished / train loss: 0.23638442720517072
epoch 7: 161760/182380 (0.89 %) finished / train loss: 0.23639244348783522
epoch 7: 161920/182380 (0.89 %) finished / train loss: 0.2363779198393049
epoch 7: 162080/182380 (0.89 %) finished / train loss: 0.2363662425939799
epoch 7: 162240/182380 (0.89 %) finished / train loss: 0.23634129476382654
epoch 7: 162400/182380 (0.89 %) finished / train loss: 0.23635859929869327
epoch 7: 162560/182380 (0.89 %)

epoch 7: 178080/182380 (0.98 %) finished / train loss: 0.23625518503161239
epoch 7: 178240/182380 (0.98 %) finished / train loss: 0.23622451561839192
epoch 7: 178400/182380 (0.98 %) finished / train loss: 0.23621409603298513
epoch 7: 178560/182380 (0.98 %) finished / train loss: 0.23623208358456585
epoch 7: 178720/182380 (0.98 %) finished / train loss: 0.23622197292698421
epoch 7: 178880/182380 (0.98 %) finished / train loss: 0.23622392453319913
epoch 7: 179040/182380 (0.98 %) finished / train loss: 0.23622465879923538
epoch 7: 179200/182380 (0.98 %) finished / train loss: 0.23622749106426325
epoch 7: 179360/182380 (0.98 %) finished / train loss: 0.23622939678093455
epoch 7: 179520/182380 (0.98 %) finished / train loss: 0.23622443270662039
epoch 7: 179680/182380 (0.99 %) finished / train loss: 0.23622599816545248
epoch 7: 179840/182380 (0.99 %) finished / train loss: 0.23624622136142331
epoch 7: 180000/182380 (0.99 %) finished / train loss: 0.23624983479711745
epoch 7: 180160/182380 (0

epoch 8: 13440/182380 (0.07 %) finished / train loss: 0.2314779016943205
epoch 8: 13600/182380 (0.07 %) finished / train loss: 0.23146592052543866
epoch 8: 13760/182380 (0.08 %) finished / train loss: 0.2312636824194775
epoch 8: 13920/182380 (0.08 %) finished / train loss: 0.23115704737860582
epoch 8: 14080/182380 (0.08 %) finished / train loss: 0.23106444677845997
epoch 8: 14240/182380 (0.08 %) finished / train loss: 0.2309052970302239
epoch 8: 14400/182380 (0.08 %) finished / train loss: 0.2308043337199423
epoch 8: 14560/182380 (0.08 %) finished / train loss: 0.23069458862582407
epoch 8: 14720/182380 (0.08 %) finished / train loss: 0.23036374689444253
epoch 8: 14880/182380 (0.08 %) finished / train loss: 0.23023056173196402
epoch 8: 15040/182380 (0.08 %) finished / train loss: 0.23050519136038233
epoch 8: 15200/182380 (0.08 %) finished / train loss: 0.23075800851771705
epoch 8: 15360/182380 (0.08 %) finished / train loss: 0.23075243157024186
epoch 8: 15520/182380 (0.09 %) finished / 

epoch 8: 31360/182380 (0.17 %) finished / train loss: 0.23143609444401703
epoch 8: 31520/182380 (0.17 %) finished / train loss: 0.23153039135303594
epoch 8: 31680/182380 (0.17 %) finished / train loss: 0.23147347098348117
epoch 8: 31840/182380 (0.17 %) finished / train loss: 0.2316192201184268
epoch 8: 32000/182380 (0.18 %) finished / train loss: 0.23175747072696687
epoch 8: 32160/182380 (0.18 %) finished / train loss: 0.23199176600026847
epoch 8: 32320/182380 (0.18 %) finished / train loss: 0.23197592049837112
epoch 8: 32480/182380 (0.18 %) finished / train loss: 0.2321138951578751
epoch 8: 32640/182380 (0.18 %) finished / train loss: 0.2321803262566819
epoch 8: 32800/182380 (0.18 %) finished / train loss: 0.23223682213120345
epoch 8: 32960/182380 (0.18 %) finished / train loss: 0.23229412547882322
epoch 8: 33120/182380 (0.18 %) finished / train loss: 0.2323139883901762
epoch 8: 33280/182380 (0.18 %) finished / train loss: 0.23239680018562536
epoch 8: 33440/182380 (0.18 %) finished / 

epoch 8: 49280/182380 (0.27 %) finished / train loss: 0.23343685822827476
epoch 8: 49440/182380 (0.27 %) finished / train loss: 0.23339608867191575
epoch 8: 49600/182380 (0.27 %) finished / train loss: 0.23334751559842018
epoch 8: 49760/182380 (0.27 %) finished / train loss: 0.23331074184735104
epoch 8: 49920/182380 (0.27 %) finished / train loss: 0.23323390130431224
epoch 8: 50080/182380 (0.27 %) finished / train loss: 0.2332032216147493
epoch 8: 50240/182380 (0.28 %) finished / train loss: 0.2331832522894167
epoch 8: 50400/182380 (0.28 %) finished / train loss: 0.23322820114710974
epoch 8: 50560/182380 (0.28 %) finished / train loss: 0.23316964368465581
epoch 8: 50720/182380 (0.28 %) finished / train loss: 0.2331438821761014
epoch 8: 50880/182380 (0.28 %) finished / train loss: 0.23316734604678063
epoch 8: 51040/182380 (0.28 %) finished / train loss: 0.23321864970238604
epoch 8: 51200/182380 (0.28 %) finished / train loss: 0.23326942267827688
epoch 8: 51360/182380 (0.28 %) finished /

epoch 8: 67200/182380 (0.37 %) finished / train loss: 0.2336225456425122
epoch 8: 67360/182380 (0.37 %) finished / train loss: 0.23361660309330584
epoch 8: 67520/182380 (0.37 %) finished / train loss: 0.2335650539723053
epoch 8: 67680/182380 (0.37 %) finished / train loss: 0.233500956481512
epoch 8: 67840/182380 (0.37 %) finished / train loss: 0.23348967035845766
epoch 8: 68000/182380 (0.37 %) finished / train loss: 0.2335671877861023
epoch 8: 68160/182380 (0.37 %) finished / train loss: 0.23354037227764934
epoch 8: 68320/182380 (0.37 %) finished / train loss: 0.2335563191066581
epoch 8: 68480/182380 (0.38 %) finished / train loss: 0.2336018223002135
epoch 8: 68640/182380 (0.38 %) finished / train loss: 0.2335867433350681
epoch 8: 68800/182380 (0.38 %) finished / train loss: 0.2335971364933391
epoch 8: 68960/182380 (0.38 %) finished / train loss: 0.23357071403560947
epoch 8: 69120/182380 (0.38 %) finished / train loss: 0.23356305891992868
epoch 8: 69280/182380 (0.38 %) finished / train

epoch 8: 85120/182380 (0.47 %) finished / train loss: 0.23435099538891835
epoch 8: 85280/182380 (0.47 %) finished / train loss: 0.2343830294389886
epoch 8: 85440/182380 (0.47 %) finished / train loss: 0.23444384364376353
epoch 8: 85600/182380 (0.47 %) finished / train loss: 0.23443474815827664
epoch 8: 85760/182380 (0.47 %) finished / train loss: 0.23442611942317948
epoch 8: 85920/182380 (0.47 %) finished / train loss: 0.2344491937695491
epoch 8: 86080/182380 (0.47 %) finished / train loss: 0.23447417045725322
epoch 8: 86240/182380 (0.47 %) finished / train loss: 0.23445461041852142
epoch 8: 86400/182380 (0.47 %) finished / train loss: 0.23446021957529917
epoch 8: 86560/182380 (0.47 %) finished / train loss: 0.23445350613699822
epoch 8: 86720/182380 (0.48 %) finished / train loss: 0.23445149419272518
epoch 8: 86880/182380 (0.48 %) finished / train loss: 0.23447943110821656
epoch 8: 87040/182380 (0.48 %) finished / train loss: 0.2344618113601909
epoch 8: 87200/182380 (0.48 %) finished /

epoch 8: 102880/182380 (0.56 %) finished / train loss: 0.23412366257299716
epoch 8: 103040/182380 (0.56 %) finished / train loss: 0.2341099308514447
epoch 8: 103200/182380 (0.57 %) finished / train loss: 0.2341127742445746
epoch 8: 103360/182380 (0.57 %) finished / train loss: 0.2341268940422188
epoch 8: 103520/182380 (0.57 %) finished / train loss: 0.23412225764169944
epoch 8: 103680/182380 (0.57 %) finished / train loss: 0.2341344678889454
epoch 8: 103840/182380 (0.57 %) finished / train loss: 0.23414695483785933
epoch 8: 104000/182380 (0.57 %) finished / train loss: 0.2341510838499436
epoch 8: 104160/182380 (0.57 %) finished / train loss: 0.23415069410694725
epoch 8: 104320/182380 (0.57 %) finished / train loss: 0.23412463968973948
epoch 8: 104480/182380 (0.57 %) finished / train loss: 0.2341065052503101
epoch 8: 104640/182380 (0.57 %) finished / train loss: 0.23409018998663725
epoch 8: 104800/182380 (0.57 %) finished / train loss: 0.23413818519989044
epoch 8: 104960/182380 (0.58 %)

epoch 8: 120480/182380 (0.66 %) finished / train loss: 0.23409185678677097
epoch 8: 120640/182380 (0.66 %) finished / train loss: 0.23407500342364654
epoch 8: 120800/182380 (0.66 %) finished / train loss: 0.23410578153386022
epoch 8: 120960/182380 (0.66 %) finished / train loss: 0.23408320330122792
epoch 8: 121120/182380 (0.66 %) finished / train loss: 0.23412136804789815
epoch 8: 121280/182380 (0.66 %) finished / train loss: 0.23411590300873905
epoch 8: 121440/182380 (0.67 %) finished / train loss: 0.23407744354174542
epoch 8: 121600/182380 (0.67 %) finished / train loss: 0.2340855239723858
epoch 8: 121760/182380 (0.67 %) finished / train loss: 0.23405030537763813
epoch 8: 121920/182380 (0.67 %) finished / train loss: 0.23401482182694233
epoch 8: 122080/182380 (0.67 %) finished / train loss: 0.23401859078854126
epoch 8: 122240/182380 (0.67 %) finished / train loss: 0.23399899952230654
epoch 8: 122400/182380 (0.67 %) finished / train loss: 0.23401163539076164
epoch 8: 122560/182380 (0.

epoch 8: 138080/182380 (0.76 %) finished / train loss: 0.2340493688094381
epoch 8: 138240/182380 (0.76 %) finished / train loss: 0.23410400803442355
epoch 8: 138400/182380 (0.76 %) finished / train loss: 0.23409115244542933
epoch 8: 138560/182380 (0.76 %) finished / train loss: 0.23409053253452994
epoch 8: 138720/182380 (0.76 %) finished / train loss: 0.2340938416181826
epoch 8: 138880/182380 (0.76 %) finished / train loss: 0.2340942756371564
epoch 8: 139040/182380 (0.76 %) finished / train loss: 0.23408712641827942
epoch 8: 139200/182380 (0.76 %) finished / train loss: 0.23407881190379462
epoch 8: 139360/182380 (0.76 %) finished / train loss: 0.23408080779794438
epoch 8: 139520/182380 (0.76 %) finished / train loss: 0.2341050942214804
epoch 8: 139680/182380 (0.77 %) finished / train loss: 0.23408441784592154
epoch 8: 139840/182380 (0.77 %) finished / train loss: 0.23409513246003769
epoch 8: 140000/182380 (0.77 %) finished / train loss: 0.23410267968858992
epoch 8: 140160/182380 (0.77 

epoch 8: 155680/182380 (0.85 %) finished / train loss: 0.2347638312646811
epoch 8: 155840/182380 (0.85 %) finished / train loss: 0.23474304115197006
epoch 8: 156000/182380 (0.86 %) finished / train loss: 0.23474303041971648
epoch 8: 156160/182380 (0.86 %) finished / train loss: 0.23474821231221077
epoch 8: 156320/182380 (0.86 %) finished / train loss: 0.2347385174267856
epoch 8: 156480/182380 (0.86 %) finished / train loss: 0.2347538878611748
epoch 8: 156640/182380 (0.86 %) finished / train loss: 0.23477200955548252
epoch 8: 156800/182380 (0.86 %) finished / train loss: 0.23476978051419162
epoch 8: 156960/182380 (0.86 %) finished / train loss: 0.23476080511080502
epoch 8: 157120/182380 (0.86 %) finished / train loss: 0.23475276015076763
epoch 8: 157280/182380 (0.86 %) finished / train loss: 0.23474576873430036
epoch 8: 157440/182380 (0.86 %) finished / train loss: 0.2347455281400826
epoch 8: 157600/182380 (0.86 %) finished / train loss: 0.2347476197499309
epoch 8: 157760/182380 (0.87 %

epoch 8: 173280/182380 (0.95 %) finished / train loss: 0.23461790455510412
epoch 8: 173440/182380 (0.95 %) finished / train loss: 0.23462304437457415
epoch 8: 173600/182380 (0.95 %) finished / train loss: 0.2345962190408311
epoch 8: 173760/182380 (0.95 %) finished / train loss: 0.23460758623991224
epoch 8: 173920/182380 (0.95 %) finished / train loss: 0.23461502692298047
epoch 8: 174080/182380 (0.95 %) finished / train loss: 0.23461099402047694
epoch 8: 174240/182380 (0.96 %) finished / train loss: 0.23462510549551419
epoch 8: 174400/182380 (0.96 %) finished / train loss: 0.2346270208812635
epoch 8: 174560/182380 (0.96 %) finished / train loss: 0.23461769425901768
epoch 8: 174720/182380 (0.96 %) finished / train loss: 0.23459564679653652
epoch 8: 174880/182380 (0.96 %) finished / train loss: 0.23458991630406742
epoch 8: 175040/182380 (0.96 %) finished / train loss: 0.23459253182849238
epoch 8: 175200/182380 (0.96 %) finished / train loss: 0.2345693656870219
epoch 8: 175360/182380 (0.96

epoch 9: 8480/182380 (0.05 %) finished / train loss: 0.2323041815240428
epoch 9: 8640/182380 (0.05 %) finished / train loss: 0.232542336318228
epoch 9: 8800/182380 (0.05 %) finished / train loss: 0.23252981624820016
epoch 9: 8960/182380 (0.05 %) finished / train loss: 0.23219898071672235
epoch 9: 9120/182380 (0.05 %) finished / train loss: 0.23199046128674558
epoch 9: 9280/182380 (0.05 %) finished / train loss: 0.23218705181417795
epoch 9: 9440/182380 (0.05 %) finished / train loss: 0.23212479514590764
epoch 9: 9600/182380 (0.05 %) finished / train loss: 0.2317698357999325
epoch 9: 9760/182380 (0.05 %) finished / train loss: 0.23174264035264
epoch 9: 9920/182380 (0.05 %) finished / train loss: 0.23150603348209012
epoch 9: 10080/182380 (0.06 %) finished / train loss: 0.23130010673924098
epoch 9: 10240/182380 (0.06 %) finished / train loss: 0.2313813937827945
epoch 9: 10400/182380 (0.06 %) finished / train loss: 0.23111712854642136
epoch 9: 10560/182380 (0.06 %) finished / train loss: 0.

epoch 9: 26400/182380 (0.14 %) finished / train loss: 0.23013829041611064
epoch 9: 26560/182380 (0.15 %) finished / train loss: 0.23017018850309304
epoch 9: 26720/182380 (0.15 %) finished / train loss: 0.2300768298481753
epoch 9: 26880/182380 (0.15 %) finished / train loss: 0.22998260481371766
epoch 9: 27040/182380 (0.15 %) finished / train loss: 0.2300075314454073
epoch 9: 27200/182380 (0.15 %) finished / train loss: 0.23011841340976602
epoch 9: 27360/182380 (0.15 %) finished / train loss: 0.23022350790904977
epoch 9: 27520/182380 (0.15 %) finished / train loss: 0.23009762800363606
epoch 9: 27680/182380 (0.15 %) finished / train loss: 0.23020188332982147
epoch 9: 27840/182380 (0.15 %) finished / train loss: 0.2302616675352228
epoch 9: 28000/182380 (0.15 %) finished / train loss: 0.2301857612984521
epoch 9: 28160/182380 (0.15 %) finished / train loss: 0.23023356868123465
epoch 9: 28320/182380 (0.16 %) finished / train loss: 0.23033888013349416
epoch 9: 28480/182380 (0.16 %) finished / 

epoch 9: 44320/182380 (0.24 %) finished / train loss: 0.23255953285237943
epoch 9: 44480/182380 (0.24 %) finished / train loss: 0.23256643682503872
epoch 9: 44640/182380 (0.24 %) finished / train loss: 0.23260551746600844
epoch 9: 44800/182380 (0.25 %) finished / train loss: 0.23260207475296088
epoch 9: 44960/182380 (0.25 %) finished / train loss: 0.23257196589084705
epoch 9: 45120/182380 (0.25 %) finished / train loss: 0.23258339330448327
epoch 9: 45280/182380 (0.25 %) finished / train loss: 0.2326123246982325
epoch 9: 45440/182380 (0.25 %) finished / train loss: 0.23257049393485968
epoch 9: 45600/182380 (0.25 %) finished / train loss: 0.23271649153609025
epoch 9: 45760/182380 (0.25 %) finished / train loss: 0.2326771431035929
epoch 9: 45920/182380 (0.25 %) finished / train loss: 0.2327087164652057
epoch 9: 46080/182380 (0.25 %) finished / train loss: 0.23261048083917962
epoch 9: 46240/182380 (0.25 %) finished / train loss: 0.2326032934510584
epoch 9: 46400/182380 (0.25 %) finished / 

epoch 9: 62240/182380 (0.34 %) finished / train loss: 0.23257543105239428
epoch 9: 62400/182380 (0.34 %) finished / train loss: 0.23256902467746002
epoch 9: 62560/182380 (0.34 %) finished / train loss: 0.23252782374239334
epoch 9: 62720/182380 (0.34 %) finished / train loss: 0.23246169967614874
epoch 9: 62880/182380 (0.34 %) finished / train loss: 0.23245006140710137
epoch 9: 63040/182380 (0.35 %) finished / train loss: 0.23248359579876596
epoch 9: 63200/182380 (0.35 %) finished / train loss: 0.23248199179202694
epoch 9: 63360/182380 (0.35 %) finished / train loss: 0.23254912595706756
epoch 9: 63520/182380 (0.35 %) finished / train loss: 0.23259763143374879
epoch 9: 63680/182380 (0.35 %) finished / train loss: 0.2325979396625979
epoch 9: 63840/182380 (0.35 %) finished / train loss: 0.2325916720213448
epoch 9: 64000/182380 (0.35 %) finished / train loss: 0.2326648753359914
epoch 9: 64160/182380 (0.35 %) finished / train loss: 0.23258050483212506
epoch 9: 64320/182380 (0.35 %) finished /

epoch 9: 80160/182380 (0.44 %) finished / train loss: 0.2320676989957482
epoch 9: 80320/182380 (0.44 %) finished / train loss: 0.2320402368843793
epoch 9: 80480/182380 (0.44 %) finished / train loss: 0.23197801020699987
epoch 9: 80640/182380 (0.44 %) finished / train loss: 0.23198134929887831
epoch 9: 80800/182380 (0.44 %) finished / train loss: 0.23197710623835574
epoch 9: 80960/182380 (0.44 %) finished / train loss: 0.23192365619504876
epoch 9: 81120/182380 (0.44 %) finished / train loss: 0.23192211525327355
epoch 9: 81280/182380 (0.45 %) finished / train loss: 0.23193386631805127
epoch 9: 81440/182380 (0.45 %) finished / train loss: 0.23194110058613984
epoch 9: 81600/182380 (0.45 %) finished / train loss: 0.23192819339387558
epoch 9: 81760/182380 (0.45 %) finished / train loss: 0.23192301596680734
epoch 9: 81920/182380 (0.45 %) finished / train loss: 0.231925696489634
epoch 9: 82080/182380 (0.45 %) finished / train loss: 0.23196206765565258
epoch 9: 82240/182380 (0.45 %) finished / 

epoch 9: 98080/182380 (0.54 %) finished / train loss: 0.2318969994102761
epoch 9: 98240/182380 (0.54 %) finished / train loss: 0.23187492796574818
epoch 9: 98400/182380 (0.54 %) finished / train loss: 0.2318508583888775
epoch 9: 98560/182380 (0.54 %) finished / train loss: 0.2318794830424058
epoch 9: 98720/182380 (0.54 %) finished / train loss: 0.231890348667457
epoch 9: 98880/182380 (0.54 %) finished / train loss: 0.23187899724565278
epoch 9: 99040/182380 (0.54 %) finished / train loss: 0.23187230201453116
epoch 9: 99200/182380 (0.54 %) finished / train loss: 0.23185032021614813
epoch 9: 99360/182380 (0.54 %) finished / train loss: 0.2318563238338188
epoch 9: 99520/182380 (0.55 %) finished / train loss: 0.23180410288441985
epoch 9: 99680/182380 (0.55 %) finished / train loss: 0.2318409077954713
epoch 9: 99840/182380 (0.55 %) finished / train loss: 0.23192201328869813
epoch 9: 100000/182380 (0.55 %) finished / train loss: 0.23192765085220338
epoch 9: 100160/182380 (0.55 %) finished / t

epoch 9: 115840/182380 (0.64 %) finished / train loss: 0.2319903510957133
epoch 9: 116000/182380 (0.64 %) finished / train loss: 0.2319981123291213
epoch 9: 116160/182380 (0.64 %) finished / train loss: 0.2319968790349553
epoch 9: 116320/182380 (0.64 %) finished / train loss: 0.23196997952838383
epoch 9: 116480/182380 (0.64 %) finished / train loss: 0.23196053115630544
epoch 9: 116640/182380 (0.64 %) finished / train loss: 0.2319534776305629
epoch 9: 116800/182380 (0.64 %) finished / train loss: 0.23197162626949075
epoch 9: 116960/182380 (0.64 %) finished / train loss: 0.23195921823932764
epoch 9: 117120/182380 (0.64 %) finished / train loss: 0.23197180811580412
epoch 9: 117280/182380 (0.64 %) finished / train loss: 0.23193680241521025
epoch 9: 117440/182380 (0.64 %) finished / train loss: 0.23192239181628344
epoch 9: 117600/182380 (0.64 %) finished / train loss: 0.23191004740543106
epoch 9: 117760/182380 (0.65 %) finished / train loss: 0.23190299506582643
epoch 9: 117920/182380 (0.65 

epoch 9: 133440/182380 (0.73 %) finished / train loss: 0.23215615841553366
epoch 9: 133600/182380 (0.73 %) finished / train loss: 0.23218499659064287
epoch 9: 133760/182380 (0.73 %) finished / train loss: 0.2321762468897555
epoch 9: 133920/182380 (0.73 %) finished / train loss: 0.2321738261368967
epoch 9: 134080/182380 (0.74 %) finished / train loss: 0.2321640086984862
epoch 9: 134240/182380 (0.74 %) finished / train loss: 0.23219308270956251
epoch 9: 134400/182380 (0.74 %) finished / train loss: 0.23220238437255222
epoch 9: 134560/182380 (0.74 %) finished / train loss: 0.23219115037059104
epoch 9: 134720/182380 (0.74 %) finished / train loss: 0.23220056432726263
epoch 9: 134880/182380 (0.74 %) finished / train loss: 0.23219250722358517
epoch 9: 135040/182380 (0.74 %) finished / train loss: 0.23219186983896659
epoch 9: 135200/182380 (0.74 %) finished / train loss: 0.2322208321447203
epoch 9: 135360/182380 (0.74 %) finished / train loss: 0.23221788395099324
epoch 9: 135520/182380 (0.74 

epoch 9: 151040/182380 (0.83 %) finished / train loss: 0.23232199268699702
epoch 9: 151200/182380 (0.83 %) finished / train loss: 0.23232615273150187
epoch 9: 151360/182380 (0.83 %) finished / train loss: 0.23234408822296537
epoch 9: 151520/182380 (0.83 %) finished / train loss: 0.23233678636732172
epoch 9: 151680/182380 (0.83 %) finished / train loss: 0.23234698749481375
epoch 9: 151840/182380 (0.83 %) finished / train loss: 0.23233726008925723
epoch 9: 152000/182380 (0.83 %) finished / train loss: 0.23232895973167922
epoch 9: 152160/182380 (0.83 %) finished / train loss: 0.2323120706496304
epoch 9: 152320/182380 (0.84 %) finished / train loss: 0.23234519072878762
epoch 9: 152480/182380 (0.84 %) finished / train loss: 0.23233326296366025
epoch 9: 152640/182380 (0.84 %) finished / train loss: 0.23230613998959398
epoch 9: 152800/182380 (0.84 %) finished / train loss: 0.2323313549238974
epoch 9: 152960/182380 (0.84 %) finished / train loss: 0.23234093870079167
epoch 9: 153120/182380 (0.8

epoch 9: 168640/182380 (0.92 %) finished / train loss: 0.2327130596144602
epoch 9: 168800/182380 (0.93 %) finished / train loss: 0.23270576505581914
epoch 9: 168960/182380 (0.93 %) finished / train loss: 0.2326982935185008
epoch 9: 169120/182380 (0.93 %) finished / train loss: 0.2326810672357608
epoch 9: 169280/182380 (0.93 %) finished / train loss: 0.23268541996781
epoch 9: 169440/182380 (0.93 %) finished / train loss: 0.23266848865210504
epoch 9: 169600/182380 (0.93 %) finished / train loss: 0.23269798657241858
epoch 9: 169760/182380 (0.93 %) finished / train loss: 0.23269470246415674
epoch 9: 169920/182380 (0.93 %) finished / train loss: 0.23269737632822407
epoch 9: 170080/182380 (0.93 %) finished / train loss: 0.23267924831312778
epoch 9: 170240/182380 (0.93 %) finished / train loss: 0.23267542449547385
epoch 9: 170400/182380 (0.93 %) finished / train loss: 0.2326490697614464
epoch 9: 170560/182380 (0.94 %) finished / train loss: 0.23264882869836762
epoch 9: 170720/182380 (0.94 %) 

epoch 10: 3680/182380 (0.02 %) finished / train loss: 0.22816079984540524
epoch 10: 3840/182380 (0.02 %) finished / train loss: 0.22792092425127825
epoch 10: 4000/182380 (0.02 %) finished / train loss: 0.22737418735027312
epoch 10: 4160/182380 (0.02 %) finished / train loss: 0.2275323117008576
epoch 10: 4320/182380 (0.02 %) finished / train loss: 0.22642287468468703
epoch 10: 4480/182380 (0.02 %) finished / train loss: 0.22559246740170888
epoch 10: 4640/182380 (0.03 %) finished / train loss: 0.2255805285840199
epoch 10: 4800/182380 (0.03 %) finished / train loss: 0.22574347704648973
epoch 10: 4960/182380 (0.03 %) finished / train loss: 0.2262634571521513
epoch 10: 5120/182380 (0.03 %) finished / train loss: 0.22564199967309834
epoch 10: 5280/182380 (0.03 %) finished / train loss: 0.2252745531725161
epoch 10: 5440/182380 (0.03 %) finished / train loss: 0.22519741899826948
epoch 10: 5600/182380 (0.03 %) finished / train loss: 0.2251662279878344
epoch 10: 5760/182380 (0.03 %) finished / t

epoch 10: 21440/182380 (0.12 %) finished / train loss: 0.22971714472592766
epoch 10: 21600/182380 (0.12 %) finished / train loss: 0.22975258072217306
epoch 10: 21760/182380 (0.12 %) finished / train loss: 0.22967396249227665
epoch 10: 21920/182380 (0.12 %) finished / train loss: 0.22970180635469672
epoch 10: 22080/182380 (0.12 %) finished / train loss: 0.2298517870730248
epoch 10: 22240/182380 (0.12 %) finished / train loss: 0.22972683589235485
epoch 10: 22400/182380 (0.12 %) finished / train loss: 0.22980490739856446
epoch 10: 22560/182380 (0.12 %) finished / train loss: 0.2300544961758539
epoch 10: 22720/182380 (0.12 %) finished / train loss: 0.23031455196545159
epoch 10: 22880/182380 (0.13 %) finished / train loss: 0.2306002024170402
epoch 10: 23040/182380 (0.13 %) finished / train loss: 0.23059301127990087
epoch 10: 23200/182380 (0.13 %) finished / train loss: 0.2307724661868194
epoch 10: 23360/182380 (0.13 %) finished / train loss: 0.23076710337645387
epoch 10: 23520/182380 (0.13 

epoch 10: 39040/182380 (0.21 %) finished / train loss: 0.23251031607878012
epoch 10: 39200/182380 (0.21 %) finished / train loss: 0.23252225693391293
epoch 10: 39360/182380 (0.22 %) finished / train loss: 0.23255400790916225
epoch 10: 39520/182380 (0.22 %) finished / train loss: 0.2325321677242696
epoch 10: 39680/182380 (0.22 %) finished / train loss: 0.23249428657995116
epoch 10: 39840/182380 (0.22 %) finished / train loss: 0.2324605913286707
epoch 10: 40000/182380 (0.22 %) finished / train loss: 0.23246333540678024
epoch 10: 40160/182380 (0.22 %) finished / train loss: 0.23242698238190426
epoch 10: 40320/182380 (0.22 %) finished / train loss: 0.23243307135407887
epoch 10: 40480/182380 (0.22 %) finished / train loss: 0.23241058510282767
epoch 10: 40640/182380 (0.22 %) finished / train loss: 0.2323805852433828
epoch 10: 40800/182380 (0.22 %) finished / train loss: 0.232297089602433
epoch 10: 40960/182380 (0.22 %) finished / train loss: 0.23222287903772668
epoch 10: 41120/182380 (0.23 %

epoch 10: 56640/182380 (0.31 %) finished / train loss: 0.23155253117030622
epoch 10: 56800/182380 (0.31 %) finished / train loss: 0.23158896507511675
epoch 10: 56960/182380 (0.31 %) finished / train loss: 0.2316068622084816
epoch 10: 57120/182380 (0.31 %) finished / train loss: 0.23153944337735324
epoch 10: 57280/182380 (0.31 %) finished / train loss: 0.2315242906688978
epoch 10: 57440/182380 (0.31 %) finished / train loss: 0.23151539767519014
epoch 10: 57600/182380 (0.32 %) finished / train loss: 0.23150060692595112
epoch 10: 57760/182380 (0.32 %) finished / train loss: 0.23144704112550887
epoch 10: 57920/182380 (0.32 %) finished / train loss: 0.2314192413954445
epoch 10: 58080/182380 (0.32 %) finished / train loss: 0.23136315821123518
epoch 10: 58240/182380 (0.32 %) finished / train loss: 0.23129262106267962
epoch 10: 58400/182380 (0.32 %) finished / train loss: 0.23125619752766335
epoch 10: 58560/182380 (0.32 %) finished / train loss: 0.2312616912312195
epoch 10: 58720/182380 (0.32 

epoch 10: 74240/182380 (0.41 %) finished / train loss: 0.23056125013992704
epoch 10: 74400/182380 (0.41 %) finished / train loss: 0.23061465605612724
epoch 10: 74560/182380 (0.41 %) finished / train loss: 0.23060312378560013
epoch 10: 74720/182380 (0.41 %) finished / train loss: 0.2306000408574907
epoch 10: 74880/182380 (0.41 %) finished / train loss: 0.2305679410441309
epoch 10: 75040/182380 (0.41 %) finished / train loss: 0.230552763369546
epoch 10: 75200/182380 (0.41 %) finished / train loss: 0.23052785318582616
epoch 10: 75360/182380 (0.41 %) finished / train loss: 0.23056890427939705
epoch 10: 75520/182380 (0.41 %) finished / train loss: 0.23057863346095814
epoch 10: 75680/182380 (0.41 %) finished / train loss: 0.23052230829542333
epoch 10: 75840/182380 (0.42 %) finished / train loss: 0.23053979065096328
epoch 10: 76000/182380 (0.42 %) finished / train loss: 0.23054894031348983
epoch 10: 76160/182380 (0.42 %) finished / train loss: 0.23049962622653536
epoch 10: 76320/182380 (0.42 

epoch 10: 91840/182380 (0.50 %) finished / train loss: 0.2301177984434553
epoch 10: 92000/182380 (0.50 %) finished / train loss: 0.23015726807324782
epoch 10: 92160/182380 (0.51 %) finished / train loss: 0.23017146495791774
epoch 10: 92320/182380 (0.51 %) finished / train loss: 0.23017943210680317
epoch 10: 92480/182380 (0.51 %) finished / train loss: 0.23018454759797424
epoch 10: 92640/182380 (0.51 %) finished / train loss: 0.2301809062251567
epoch 10: 92800/182380 (0.51 %) finished / train loss: 0.2301855228070555
epoch 10: 92960/182380 (0.51 %) finished / train loss: 0.23016478922506617
epoch 10: 93120/182380 (0.51 %) finished / train loss: 0.23015904094755035
epoch 10: 93280/182380 (0.51 %) finished / train loss: 0.23014766459910785
epoch 10: 93440/182380 (0.51 %) finished / train loss: 0.23012698015631877
epoch 10: 93600/182380 (0.51 %) finished / train loss: 0.23013226446432944
epoch 10: 93760/182380 (0.51 %) finished / train loss: 0.23009423296199316
epoch 10: 93920/182380 (0.51

epoch 10: 109280/182380 (0.60 %) finished / train loss: 0.2306830344795308
epoch 10: 109440/182380 (0.60 %) finished / train loss: 0.23070801620246373
epoch 10: 109600/182380 (0.60 %) finished / train loss: 0.2307175926831517
epoch 10: 109760/182380 (0.60 %) finished / train loss: 0.2306921595951906
epoch 10: 109920/182380 (0.60 %) finished / train loss: 0.23070711922524104
epoch 10: 110080/182380 (0.60 %) finished / train loss: 0.23072627727808648
epoch 10: 110240/182380 (0.60 %) finished / train loss: 0.23069811274334032
epoch 10: 110400/182380 (0.61 %) finished / train loss: 0.23069008149530576
epoch 10: 110560/182380 (0.61 %) finished / train loss: 0.23073043718438072
epoch 10: 110720/182380 (0.61 %) finished / train loss: 0.23071794508595686
epoch 10: 110880/182380 (0.61 %) finished / train loss: 0.2306857073590869
epoch 10: 111040/182380 (0.61 %) finished / train loss: 0.23068440341812047
epoch 10: 111200/182380 (0.61 %) finished / train loss: 0.2307064845150323
epoch 10: 111360/

epoch 10: 126720/182380 (0.69 %) finished / train loss: 0.23063201480968432
epoch 10: 126880/182380 (0.70 %) finished / train loss: 0.23063709963991544
epoch 10: 127040/182380 (0.70 %) finished / train loss: 0.23062575067621033
epoch 10: 127200/182380 (0.70 %) finished / train loss: 0.23061793759933807
epoch 10: 127360/182380 (0.70 %) finished / train loss: 0.2306000532554322
epoch 10: 127520/182380 (0.70 %) finished / train loss: 0.23062230786834487
epoch 10: 127680/182380 (0.70 %) finished / train loss: 0.23059946005804496
epoch 10: 127840/182380 (0.70 %) finished / train loss: 0.23059832210534803
epoch 10: 128000/182380 (0.70 %) finished / train loss: 0.23057751808688046
epoch 10: 128160/182380 (0.70 %) finished / train loss: 0.23055134410789693
epoch 10: 128320/182380 (0.70 %) finished / train loss: 0.23054789421415686
epoch 10: 128480/182380 (0.70 %) finished / train loss: 0.23055414570075639
epoch 10: 128640/182380 (0.71 %) finished / train loss: 0.2305518084089851
epoch 10: 1288

epoch 10: 144160/182380 (0.79 %) finished / train loss: 0.2309615719761621
epoch 10: 144320/182380 (0.79 %) finished / train loss: 0.23096687151098463
epoch 10: 144480/182380 (0.79 %) finished / train loss: 0.23095467393910502
epoch 10: 144640/182380 (0.79 %) finished / train loss: 0.23097403497492844
epoch 10: 144800/182380 (0.79 %) finished / train loss: 0.2309730628083424
epoch 10: 144960/182380 (0.79 %) finished / train loss: 0.23098034360682465
epoch 10: 145120/182380 (0.80 %) finished / train loss: 0.2309826862292884
epoch 10: 145280/182380 (0.80 %) finished / train loss: 0.23096872401723254
epoch 10: 145440/182380 (0.80 %) finished / train loss: 0.23096793187398984
epoch 10: 145600/182380 (0.80 %) finished / train loss: 0.23097514573361846
epoch 10: 145760/182380 (0.80 %) finished / train loss: 0.23096214091215123
epoch 10: 145920/182380 (0.80 %) finished / train loss: 0.2309860392555333
epoch 10: 146080/182380 (0.80 %) finished / train loss: 0.23101805271284995
epoch 10: 146240

epoch 10: 161600/182380 (0.89 %) finished / train loss: 0.23080479894829267
epoch 10: 161760/182380 (0.89 %) finished / train loss: 0.23079172152027297
epoch 10: 161920/182380 (0.89 %) finished / train loss: 0.23078960250665548
epoch 10: 162080/182380 (0.89 %) finished / train loss: 0.23082782085709133
epoch 10: 162240/182380 (0.89 %) finished / train loss: 0.230863751794342
epoch 10: 162400/182380 (0.89 %) finished / train loss: 0.23086824973228529
epoch 10: 162560/182380 (0.89 %) finished / train loss: 0.23084678308759618
epoch 10: 162720/182380 (0.89 %) finished / train loss: 0.23085640544326375
epoch 10: 162880/182380 (0.89 %) finished / train loss: 0.2308546724950635
epoch 10: 163040/182380 (0.89 %) finished / train loss: 0.23084874416941867
epoch 10: 163200/182380 (0.89 %) finished / train loss: 0.23084479012617878
epoch 10: 163360/182380 (0.90 %) finished / train loss: 0.23085697442731007
epoch 10: 163520/182380 (0.90 %) finished / train loss: 0.23083609846181832
epoch 10: 16368

epoch 10: 179040/182380 (0.98 %) finished / train loss: 0.23098349553783415
epoch 10: 179200/182380 (0.98 %) finished / train loss: 0.23100503931753338
epoch 10: 179360/182380 (0.98 %) finished / train loss: 0.2310324646937964
epoch 10: 179520/182380 (0.98 %) finished / train loss: 0.23104840852917835
epoch 10: 179680/182380 (0.99 %) finished / train loss: 0.2310540881482279
epoch 10: 179840/182380 (0.99 %) finished / train loss: 0.23106718265792867
epoch 10: 180000/182380 (0.99 %) finished / train loss: 0.23106632321543163
epoch 10: 180160/182380 (0.99 %) finished / train loss: 0.2310637166707067
epoch 10: 180320/182380 (0.99 %) finished / train loss: 0.23105541190401896
epoch 10: 180480/182380 (0.99 %) finished / train loss: 0.2310396193889967
epoch 10: 180640/182380 (0.99 %) finished / train loss: 0.23103019807246852
epoch 10: 180800/182380 (0.99 %) finished / train loss: 0.2310242757161634
epoch 10: 180960/182380 (0.99 %) finished / train loss: 0.23102435255003229
epoch 10: 181120/

epoch 11: 14080/182380 (0.08 %) finished / train loss: 0.2264197508042509
epoch 11: 14240/182380 (0.08 %) finished / train loss: 0.22642667008919662
epoch 11: 14400/182380 (0.08 %) finished / train loss: 0.22655003935098647
epoch 11: 14560/182380 (0.08 %) finished / train loss: 0.22635024913719723
epoch 11: 14720/182380 (0.08 %) finished / train loss: 0.22652824789933537
epoch 11: 14880/182380 (0.08 %) finished / train loss: 0.22654897916701533
epoch 11: 15040/182380 (0.08 %) finished / train loss: 0.2268427386879921
epoch 11: 15200/182380 (0.08 %) finished / train loss: 0.2267758906515021
epoch 11: 15360/182380 (0.08 %) finished / train loss: 0.22683101423705618
epoch 11: 15520/182380 (0.09 %) finished / train loss: 0.22672658922131528
epoch 11: 15680/182380 (0.09 %) finished / train loss: 0.22680310342384843
epoch 11: 15840/182380 (0.09 %) finished / train loss: 0.22700083228674803
epoch 11: 16000/182380 (0.09 %) finished / train loss: 0.22707884359359742
epoch 11: 16160/182380 (0.09

epoch 11: 31680/182380 (0.17 %) finished / train loss: 0.22654924644063218
epoch 11: 31840/182380 (0.17 %) finished / train loss: 0.22661207827491378
epoch 11: 32000/182380 (0.18 %) finished / train loss: 0.2266005747616291
epoch 11: 32160/182380 (0.18 %) finished / train loss: 0.22666885685268326
epoch 11: 32320/182380 (0.18 %) finished / train loss: 0.2268304518101239
epoch 11: 32480/182380 (0.18 %) finished / train loss: 0.22684212460600098
epoch 11: 32640/182380 (0.18 %) finished / train loss: 0.2268400644700901
epoch 11: 32800/182380 (0.18 %) finished / train loss: 0.22664965347545904
epoch 11: 32960/182380 (0.18 %) finished / train loss: 0.22652803710074101
epoch 11: 33120/182380 (0.18 %) finished / train loss: 0.22656967845803874
epoch 11: 33280/182380 (0.18 %) finished / train loss: 0.22658618586854293
epoch 11: 33440/182380 (0.18 %) finished / train loss: 0.22667214819118736
epoch 11: 33600/182380 (0.18 %) finished / train loss: 0.22667411115907488
epoch 11: 33760/182380 (0.19

epoch 11: 49280/182380 (0.27 %) finished / train loss: 0.22666164514693346
epoch 11: 49440/182380 (0.27 %) finished / train loss: 0.22665706969387708
epoch 11: 49600/182380 (0.27 %) finished / train loss: 0.22668081632544917
epoch 11: 49760/182380 (0.27 %) finished / train loss: 0.2266092896748969
epoch 11: 49920/182380 (0.27 %) finished / train loss: 0.22648932691185902
epoch 11: 50080/182380 (0.27 %) finished / train loss: 0.2264866760363594
epoch 11: 50240/182380 (0.28 %) finished / train loss: 0.22649797998416196
epoch 11: 50400/182380 (0.28 %) finished / train loss: 0.2265747207403183
epoch 11: 50560/182380 (0.28 %) finished / train loss: 0.22654053835740573
epoch 11: 50720/182380 (0.28 %) finished / train loss: 0.22643115967042063
epoch 11: 50880/182380 (0.28 %) finished / train loss: 0.22638475807770242
epoch 11: 51040/182380 (0.28 %) finished / train loss: 0.22640936754900834
epoch 11: 51200/182380 (0.28 %) finished / train loss: 0.22636927447281777
epoch 11: 51360/182380 (0.28

epoch 11: 66880/182380 (0.37 %) finished / train loss: 0.22711369598453696
epoch 11: 67040/182380 (0.37 %) finished / train loss: 0.22715075809801963
epoch 11: 67200/182380 (0.37 %) finished / train loss: 0.22715860985574268
epoch 11: 67360/182380 (0.37 %) finished / train loss: 0.22717812490293363
epoch 11: 67520/182380 (0.37 %) finished / train loss: 0.22721866737892277
epoch 11: 67680/182380 (0.37 %) finished / train loss: 0.22723787362834805
epoch 11: 67840/182380 (0.37 %) finished / train loss: 0.22723697923686145
epoch 11: 68000/182380 (0.37 %) finished / train loss: 0.2272393534113379
epoch 11: 68160/182380 (0.37 %) finished / train loss: 0.22722803164675762
epoch 11: 68320/182380 (0.37 %) finished / train loss: 0.2272491018721873
epoch 11: 68480/182380 (0.38 %) finished / train loss: 0.22728844906125112
epoch 11: 68640/182380 (0.38 %) finished / train loss: 0.22731985781159433
epoch 11: 68800/182380 (0.38 %) finished / train loss: 0.22732129399859627
epoch 11: 68960/182380 (0.3

epoch 11: 84480/182380 (0.46 %) finished / train loss: 0.22751792941355345
epoch 11: 84640/182380 (0.46 %) finished / train loss: 0.2275411912365086
epoch 11: 84800/182380 (0.46 %) finished / train loss: 0.22756777889323684
epoch 11: 84960/182380 (0.47 %) finished / train loss: 0.2275295830547473
epoch 11: 85120/182380 (0.47 %) finished / train loss: 0.22749469326739025
epoch 11: 85280/182380 (0.47 %) finished / train loss: 0.2274953852954546
epoch 11: 85440/182380 (0.47 %) finished / train loss: 0.22750867729106647
epoch 11: 85600/182380 (0.47 %) finished / train loss: 0.2275572175344574
epoch 11: 85760/182380 (0.47 %) finished / train loss: 0.22756434132470124
epoch 11: 85920/182380 (0.47 %) finished / train loss: 0.22753698160417474
epoch 11: 86080/182380 (0.47 %) finished / train loss: 0.22754146580802465
epoch 11: 86240/182380 (0.47 %) finished / train loss: 0.22751480240879343
epoch 11: 86400/182380 (0.47 %) finished / train loss: 0.22750363559082704
epoch 11: 86560/182380 (0.47 

epoch 11: 102080/182380 (0.56 %) finished / train loss: 0.22800098677694236
epoch 11: 102240/182380 (0.56 %) finished / train loss: 0.22800415746855998
epoch 11: 102400/182380 (0.56 %) finished / train loss: 0.22801569243427366
epoch 11: 102560/182380 (0.56 %) finished / train loss: 0.2280320698776037
epoch 11: 102720/182380 (0.56 %) finished / train loss: 0.22805301590686275
epoch 11: 102880/182380 (0.56 %) finished / train loss: 0.22802935577291722
epoch 11: 103040/182380 (0.56 %) finished / train loss: 0.22801910755889757
epoch 11: 103200/182380 (0.57 %) finished / train loss: 0.22803687100262604
epoch 11: 103360/182380 (0.57 %) finished / train loss: 0.22802764229453384
epoch 11: 103520/182380 (0.57 %) finished / train loss: 0.22802051624982766
epoch 11: 103680/182380 (0.57 %) finished / train loss: 0.22803095802204845
epoch 11: 103840/182380 (0.57 %) finished / train loss: 0.22807210009252346
epoch 11: 104000/182380 (0.57 %) finished / train loss: 0.22802260237473707
epoch 11: 104

epoch 11: 119520/182380 (0.66 %) finished / train loss: 0.22827787183055598
epoch 11: 119680/182380 (0.66 %) finished / train loss: 0.22829031384086865
epoch 11: 119840/182380 (0.66 %) finished / train loss: 0.2282621760950865
epoch 11: 120000/182380 (0.66 %) finished / train loss: 0.2282493723710378
epoch 11: 120160/182380 (0.66 %) finished / train loss: 0.22825453836971846
epoch 11: 120320/182380 (0.66 %) finished / train loss: 0.2282487878734444
epoch 11: 120480/182380 (0.66 %) finished / train loss: 0.2282263501983873
epoch 11: 120640/182380 (0.66 %) finished / train loss: 0.2282638442453086
epoch 11: 120800/182380 (0.66 %) finished / train loss: 0.22829341000673786
epoch 11: 120960/182380 (0.66 %) finished / train loss: 0.22829381343785418
epoch 11: 121120/182380 (0.66 %) finished / train loss: 0.22826825052775354
epoch 11: 121280/182380 (0.66 %) finished / train loss: 0.22827049183971335
epoch 11: 121440/182380 (0.67 %) finished / train loss: 0.22824286708561642
epoch 11: 121600/

epoch 11: 136960/182380 (0.75 %) finished / train loss: 0.22844978491209936
epoch 11: 137120/182380 (0.75 %) finished / train loss: 0.22846222451367484
epoch 11: 137280/182380 (0.75 %) finished / train loss: 0.22850621248875463
epoch 11: 137440/182380 (0.75 %) finished / train loss: 0.22851036672889147
epoch 11: 137600/182380 (0.75 %) finished / train loss: 0.22851928724452505
epoch 11: 137760/182380 (0.76 %) finished / train loss: 0.2284962892566962
epoch 11: 137920/182380 (0.76 %) finished / train loss: 0.2284844228950288
epoch 11: 138080/182380 (0.76 %) finished / train loss: 0.22848359799122617
epoch 11: 138240/182380 (0.76 %) finished / train loss: 0.2284838957781041
epoch 11: 138400/182380 (0.76 %) finished / train loss: 0.2284678040798
epoch 11: 138560/182380 (0.76 %) finished / train loss: 0.22845883753159305
epoch 11: 138720/182380 (0.76 %) finished / train loss: 0.22845236807545988
epoch 11: 138880/182380 (0.76 %) finished / train loss: 0.22844143642395873
epoch 11: 139040/18

epoch 11: 154400/182380 (0.85 %) finished / train loss: 0.22829485489914456
epoch 11: 154560/182380 (0.85 %) finished / train loss: 0.22829168904457034
epoch 11: 154720/182380 (0.85 %) finished / train loss: 0.22827452183262886
epoch 11: 154880/182380 (0.85 %) finished / train loss: 0.22828847130160193
epoch 11: 155040/182380 (0.85 %) finished / train loss: 0.22831942462453655
epoch 11: 155200/182380 (0.85 %) finished / train loss: 0.228317312275626
epoch 11: 155360/182380 (0.85 %) finished / train loss: 0.22832845904615953
epoch 11: 155520/182380 (0.85 %) finished / train loss: 0.2283054323966611
epoch 11: 155680/182380 (0.85 %) finished / train loss: 0.22830102843407615
epoch 11: 155840/182380 (0.85 %) finished / train loss: 0.2283135068796009
epoch 11: 156000/182380 (0.86 %) finished / train loss: 0.22832373331754635
epoch 11: 156160/182380 (0.86 %) finished / train loss: 0.22833338423525212
epoch 11: 156320/182380 (0.86 %) finished / train loss: 0.22832609733515166
epoch 11: 156480

epoch 11: 171840/182380 (0.94 %) finished / train loss: 0.22891681302526143
epoch 11: 172000/182380 (0.94 %) finished / train loss: 0.22895955498828444
epoch 11: 172160/182380 (0.94 %) finished / train loss: 0.22895559965179313
epoch 11: 172320/182380 (0.94 %) finished / train loss: 0.22895589060216673
epoch 11: 172480/182380 (0.95 %) finished / train loss: 0.22894927187510014
epoch 11: 172640/182380 (0.95 %) finished / train loss: 0.22895272751446671
epoch 11: 172800/182380 (0.95 %) finished / train loss: 0.22894096885842305
epoch 11: 172960/182380 (0.95 %) finished / train loss: 0.22893217293120005
epoch 11: 173120/182380 (0.95 %) finished / train loss: 0.2289424685310304
epoch 11: 173280/182380 (0.95 %) finished / train loss: 0.2289394881228881
epoch 11: 173440/182380 (0.95 %) finished / train loss: 0.2289507201731865
epoch 11: 173600/182380 (0.95 %) finished / train loss: 0.2289491908918328
epoch 11: 173760/182380 (0.95 %) finished / train loss: 0.2289435214622025
epoch 11: 173920/

epoch 12: 6880/182380 (0.04 %) finished / train loss: 0.22793107150599015
epoch 12: 7040/182380 (0.04 %) finished / train loss: 0.2279822233725678
epoch 12: 7200/182380 (0.04 %) finished / train loss: 0.22775090906355117
epoch 12: 7360/182380 (0.04 %) finished / train loss: 0.22773402100024015
epoch 12: 7520/182380 (0.04 %) finished / train loss: 0.22815629091668635
epoch 12: 7680/182380 (0.04 %) finished / train loss: 0.227979408018291
epoch 12: 7840/182380 (0.04 %) finished / train loss: 0.22802690614242943
epoch 12: 8000/182380 (0.04 %) finished / train loss: 0.22770402538776396
epoch 12: 8160/182380 (0.04 %) finished / train loss: 0.22794850433574004
epoch 12: 8320/182380 (0.05 %) finished / train loss: 0.22789552389429166
epoch 12: 8480/182380 (0.05 %) finished / train loss: 0.22794257250596892
epoch 12: 8640/182380 (0.05 %) finished / train loss: 0.22741407796188637
epoch 12: 8800/182380 (0.05 %) finished / train loss: 0.22762874912131917
epoch 12: 8960/182380 (0.05 %) finished /

epoch 12: 24480/182380 (0.13 %) finished / train loss: 0.22744502840088862
epoch 12: 24640/182380 (0.14 %) finished / train loss: 0.2275869879629705
epoch 12: 24800/182380 (0.14 %) finished / train loss: 0.22764989918278108
epoch 12: 24960/182380 (0.14 %) finished / train loss: 0.2276095341031368
epoch 12: 25120/182380 (0.14 %) finished / train loss: 0.22758988445731484
epoch 12: 25280/182380 (0.14 %) finished / train loss: 0.22789133613622642
epoch 12: 25440/182380 (0.14 %) finished / train loss: 0.2280032126221267
epoch 12: 25600/182380 (0.14 %) finished / train loss: 0.22794886805117132
epoch 12: 25760/182380 (0.14 %) finished / train loss: 0.22798668825478288
epoch 12: 25920/182380 (0.14 %) finished / train loss: 0.22801430254806707
epoch 12: 26080/182380 (0.14 %) finished / train loss: 0.22797729058499716
epoch 12: 26240/182380 (0.14 %) finished / train loss: 0.22799660643426384
epoch 12: 26400/182380 (0.14 %) finished / train loss: 0.2280838823860342
epoch 12: 26560/182380 (0.15 

epoch 12: 42080/182380 (0.23 %) finished / train loss: 0.22722481456319643
epoch 12: 42240/182380 (0.23 %) finished / train loss: 0.22723355236830134
epoch 12: 42400/182380 (0.23 %) finished / train loss: 0.2272649760403723
epoch 12: 42560/182380 (0.23 %) finished / train loss: 0.22726141467578428
epoch 12: 42720/182380 (0.23 %) finished / train loss: 0.22721301499154237
epoch 12: 42880/182380 (0.24 %) finished / train loss: 0.2270550107889211
epoch 12: 43040/182380 (0.24 %) finished / train loss: 0.22697169192440006
epoch 12: 43200/182380 (0.24 %) finished / train loss: 0.22688828424171165
epoch 12: 43360/182380 (0.24 %) finished / train loss: 0.22684101885755123
epoch 12: 43520/182380 (0.24 %) finished / train loss: 0.22683034041786895
epoch 12: 43680/182380 (0.24 %) finished / train loss: 0.22678387346285167
epoch 12: 43840/182380 (0.24 %) finished / train loss: 0.2268249070992435
epoch 12: 44000/182380 (0.24 %) finished / train loss: 0.22687398538806222
epoch 12: 44160/182380 (0.24

epoch 12: 59680/182380 (0.33 %) finished / train loss: 0.2270050604685382
epoch 12: 59840/182380 (0.33 %) finished / train loss: 0.22699523528310706
epoch 12: 60000/182380 (0.33 %) finished / train loss: 0.22701755640506743
epoch 12: 60160/182380 (0.33 %) finished / train loss: 0.22700845964569993
epoch 12: 60320/182380 (0.33 %) finished / train loss: 0.227059861480083
epoch 12: 60480/182380 (0.33 %) finished / train loss: 0.22703542479920008
epoch 12: 60640/182380 (0.33 %) finished / train loss: 0.22705671871400446
epoch 12: 60800/182380 (0.33 %) finished / train loss: 0.22704249927872105
epoch 12: 60960/182380 (0.33 %) finished / train loss: 0.227048825247707
epoch 12: 61120/182380 (0.34 %) finished / train loss: 0.22709904528413144
epoch 12: 61280/182380 (0.34 %) finished / train loss: 0.22704896474787212
epoch 12: 61440/182380 (0.34 %) finished / train loss: 0.22701193436514586
epoch 12: 61600/182380 (0.34 %) finished / train loss: 0.22702708983576142
epoch 12: 61760/182380 (0.34 %

epoch 12: 77280/182380 (0.42 %) finished / train loss: 0.22649157813000137
epoch 12: 77440/182380 (0.42 %) finished / train loss: 0.22647350947103226
epoch 12: 77600/182380 (0.43 %) finished / train loss: 0.22651049781091434
epoch 12: 77760/182380 (0.43 %) finished / train loss: 0.22650868501437543
epoch 12: 77920/182380 (0.43 %) finished / train loss: 0.22650423023000635
epoch 12: 78080/182380 (0.43 %) finished / train loss: 0.2265383093633124
epoch 12: 78240/182380 (0.43 %) finished / train loss: 0.22647318439615285
epoch 12: 78400/182380 (0.43 %) finished / train loss: 0.22650157920560057
epoch 12: 78560/182380 (0.43 %) finished / train loss: 0.22642382923551588
epoch 12: 78720/182380 (0.43 %) finished / train loss: 0.22642583350340525
epoch 12: 78880/182380 (0.43 %) finished / train loss: 0.22639322883579843
epoch 12: 79040/182380 (0.43 %) finished / train loss: 0.2264468729797645
epoch 12: 79200/182380 (0.43 %) finished / train loss: 0.22639998876687253
epoch 12: 79360/182380 (0.4

epoch 12: 94880/182380 (0.52 %) finished / train loss: 0.22748991928956963
epoch 12: 95040/182380 (0.52 %) finished / train loss: 0.22743744756838288
epoch 12: 95200/182380 (0.52 %) finished / train loss: 0.22743755463792498
epoch 12: 95360/182380 (0.52 %) finished / train loss: 0.22745890328848123
epoch 12: 95520/182380 (0.52 %) finished / train loss: 0.2274798765853422
epoch 12: 95680/182380 (0.52 %) finished / train loss: 0.22748939504591517
epoch 12: 95840/182380 (0.53 %) finished / train loss: 0.2274997665756732
epoch 12: 96000/182380 (0.53 %) finished / train loss: 0.2275121945142746
epoch 12: 96160/182380 (0.53 %) finished / train loss: 0.22750109589833784
epoch 12: 96320/182380 (0.53 %) finished / train loss: 0.2274827615862273
epoch 12: 96480/182380 (0.53 %) finished / train loss: 0.22745339867487477
epoch 12: 96640/182380 (0.53 %) finished / train loss: 0.2274328622350235
epoch 12: 96800/182380 (0.53 %) finished / train loss: 0.2274312629581483
epoch 12: 96960/182380 (0.53 %)

epoch 12: 112320/182380 (0.62 %) finished / train loss: 0.22752657082260844
epoch 12: 112480/182380 (0.62 %) finished / train loss: 0.22755996764214925
epoch 12: 112640/182380 (0.62 %) finished / train loss: 0.22756224652667614
epoch 12: 112800/182380 (0.62 %) finished / train loss: 0.22756550237642112
epoch 12: 112960/182380 (0.62 %) finished / train loss: 0.22759197108215382
epoch 12: 113120/182380 (0.62 %) finished / train loss: 0.2275556954206132
epoch 12: 113280/182380 (0.62 %) finished / train loss: 0.22750815460826718
epoch 12: 113440/182380 (0.62 %) finished / train loss: 0.22747551817735934
epoch 12: 113600/182380 (0.62 %) finished / train loss: 0.22746117794597653
epoch 12: 113760/182380 (0.62 %) finished / train loss: 0.2274519313194916
epoch 12: 113920/182380 (0.62 %) finished / train loss: 0.22744280645686588
epoch 12: 114080/182380 (0.63 %) finished / train loss: 0.22741915644218344
epoch 12: 114240/182380 (0.63 %) finished / train loss: 0.22740876695939471
epoch 12: 1144

epoch 12: 129760/182380 (0.71 %) finished / train loss: 0.22733117165974123
epoch 12: 129920/182380 (0.71 %) finished / train loss: 0.2272867199161957
epoch 12: 130080/182380 (0.71 %) finished / train loss: 0.22729033378364122
epoch 12: 130240/182380 (0.71 %) finished / train loss: 0.22728899835954428
epoch 12: 130400/182380 (0.71 %) finished / train loss: 0.22729311140037023
epoch 12: 130560/182380 (0.72 %) finished / train loss: 0.2272894388064742
epoch 12: 130720/182380 (0.72 %) finished / train loss: 0.2272918202776366
epoch 12: 130880/182380 (0.72 %) finished / train loss: 0.2273011981165788
epoch 12: 131040/182380 (0.72 %) finished / train loss: 0.2273107730206989
epoch 12: 131200/182380 (0.72 %) finished / train loss: 0.2273159989532901
epoch 12: 131360/182380 (0.72 %) finished / train loss: 0.22731518046283838
epoch 12: 131520/182380 (0.72 %) finished / train loss: 0.22729080438686403
epoch 12: 131680/182380 (0.72 %) finished / train loss: 0.22727847022173037
epoch 12: 131840/1

epoch 12: 147200/182380 (0.81 %) finished / train loss: 0.22718729919713476
epoch 12: 147360/182380 (0.81 %) finished / train loss: 0.22717510757888956
epoch 12: 147520/182380 (0.81 %) finished / train loss: 0.22718812214319722
epoch 12: 147680/182380 (0.81 %) finished / train loss: 0.22720254472702064
epoch 12: 147840/182380 (0.81 %) finished / train loss: 0.22718734520273806
epoch 12: 148000/182380 (0.81 %) finished / train loss: 0.22718765685687195
epoch 12: 148160/182380 (0.81 %) finished / train loss: 0.22717139432548705
epoch 12: 148320/182380 (0.81 %) finished / train loss: 0.2271754558996861
epoch 12: 148480/182380 (0.81 %) finished / train loss: 0.22713504920488803
epoch 12: 148640/182380 (0.82 %) finished / train loss: 0.22715073330217594
epoch 12: 148800/182380 (0.82 %) finished / train loss: 0.22720179862553075
epoch 12: 148960/182380 (0.82 %) finished / train loss: 0.22722181552975057
epoch 12: 149120/182380 (0.82 %) finished / train loss: 0.2272124944646471
epoch 12: 1492

epoch 12: 164640/182380 (0.90 %) finished / train loss: 0.22720058587306444
epoch 12: 164800/182380 (0.90 %) finished / train loss: 0.22722068912774615
epoch 12: 164960/182380 (0.90 %) finished / train loss: 0.227230270994623
epoch 12: 165120/182380 (0.91 %) finished / train loss: 0.22723836902269098
epoch 12: 165280/182380 (0.91 %) finished / train loss: 0.227217465595839
epoch 12: 165440/182380 (0.91 %) finished / train loss: 0.22721370045290232
epoch 12: 165600/182380 (0.91 %) finished / train loss: 0.227205117923626
epoch 12: 165760/182380 (0.91 %) finished / train loss: 0.2272104037860876
epoch 12: 165920/182380 (0.91 %) finished / train loss: 0.22720440416062465
epoch 12: 166080/182380 (0.91 %) finished / train loss: 0.22720888524903038
epoch 12: 166240/182380 (0.91 %) finished / train loss: 0.22720129945395198
epoch 12: 166400/182380 (0.91 %) finished / train loss: 0.22717823861596675
epoch 12: 166560/182380 (0.91 %) finished / train loss: 0.22716845923267112
epoch 12: 166720/18

epoch 12: 182080/182380 (1.00 %) finished / train loss: 0.22732027660407164
epoch 12: 182240/182380 (1.00 %) finished / train loss: 0.2273222292092309
epoch 12: 182380/182380 (1.00 %) finished / train loss: 0.22731551469150166
