In [10]:

import sys
sys.path.append('/home/pedru/Documents/tiny_diffusion_model')

from tiny_diffusion_model import TimeInputMLP, ScheduleLogLinear, BarnsleyFern, training_loop, moving_average, samples


In [11]:
import torch
from torch.utils.data import DataLoader
import matplotlib.pyplot as plt
import numpy as np

# Configurações
BATCH_SIZE = 2048
EPOCHS = 10000
LR = 1e-3
DEVICE = 'cuda' if torch.cuda.is_available() else 'cpu'

# 1. Dataset
dataset = BarnsleyFern(10000)
loader = DataLoader(dataset, batch_size=BATCH_SIZE, shuffle=True)

# 2. Modelo e scheduler
model = TimeInputMLP(dim=2).to(DEVICE)
schedule = ScheduleLogLinear(N=200, sigma_min=0.01, sigma_max=10)

# 3. Treinamento
losses = []
for state in training_loop(loader, model, schedule, epochs=EPOCHS, lr=LR):
    losses.append(state.loss.item())
    if state._ % 10 == 0:
        print(f"Epoch {state._}: Loss = {state.loss.item():.4f}")

# 4. Visualização da perda
plt.plot(moving_average(losses, 10))
plt.title("Training Loss (Moving Average)")
plt.xlabel("Step")
plt.ylabel("Loss")
plt.grid()
plt.show()

# 5. Geração de amostras
sigmas = schedule.sample_sigmas(steps=50).to(DEVICE)

samples_list = []
for sample in samples(model, sigmas, batchsize=1024):
    samples_list.append(sample.cpu())

# 6. Visualizar imagem final
final_sample = samples_list[-1].numpy()
plt.scatter(final_sample[:, 0], final_sample[:, 1], s=0.5, alpha=0.7)
plt.title("Generated Sample (Final Step)")
plt.axis('equal')
plt.grid(True)
plt.show()


  0%|          | 2/10000 [00:00<17:23,  9.58it/s]

Epoch 0: Loss = 0.9817
Epoch 0: Loss = 0.9796
Epoch 0: Loss = 0.9763
Epoch 0: Loss = 0.9569
Epoch 0: Loss = 0.9366


  0%|          | 12/10000 [00:01<14:36, 11.40it/s]

Epoch 10: Loss = 0.7908
Epoch 10: Loss = 0.7631
Epoch 10: Loss = 0.7722
Epoch 10: Loss = 0.7920
Epoch 10: Loss = 0.7609


  0%|          | 22/10000 [00:01<14:01, 11.85it/s]

Epoch 20: Loss = 0.7328
Epoch 20: Loss = 0.7611
Epoch 20: Loss = 0.7571
Epoch 20: Loss = 0.7483
Epoch 20: Loss = 0.7199


  0%|          | 32/10000 [00:02<15:02, 11.04it/s]

Epoch 30: Loss = 0.7186
Epoch 30: Loss = 0.7514
Epoch 30: Loss = 0.7360
Epoch 30: Loss = 0.7403
Epoch 30: Loss = 0.7477


  0%|          | 42/10000 [00:03<14:20, 11.57it/s]

Epoch 40: Loss = 0.7394
Epoch 40: Loss = 0.7233
Epoch 40: Loss = 0.7183
Epoch 40: Loss = 0.7207
Epoch 40: Loss = 0.7445


  1%|          | 52/10000 [00:04<12:18, 13.48it/s]

Epoch 50: Loss = 0.7177
Epoch 50: Loss = 0.7211
Epoch 50: Loss = 0.7284
Epoch 50: Loss = 0.7070
Epoch 50: Loss = 0.7158


  1%|          | 62/10000 [00:05<12:25, 13.34it/s]

Epoch 60: Loss = 0.6914
Epoch 60: Loss = 0.6717
Epoch 60: Loss = 0.7221
Epoch 60: Loss = 0.6986
Epoch 60: Loss = 0.7089


  1%|          | 72/10000 [00:06<13:05, 12.63it/s]

Epoch 70: Loss = 0.6717
Epoch 70: Loss = 0.7454
Epoch 70: Loss = 0.6837
Epoch 70: Loss = 0.7117
Epoch 70: Loss = 0.7186


  1%|          | 82/10000 [00:06<12:08, 13.62it/s]

Epoch 80: Loss = 0.6754
Epoch 80: Loss = 0.7151
Epoch 80: Loss = 0.7278
Epoch 80: Loss = 0.6965
Epoch 80: Loss = 0.6972


  1%|          | 92/10000 [00:07<12:22, 13.34it/s]

Epoch 90: Loss = 0.7323
Epoch 90: Loss = 0.7100
Epoch 90: Loss = 0.6927
Epoch 90: Loss = 0.7078
Epoch 90: Loss = 0.6892


  1%|          | 102/10000 [00:08<14:19, 11.52it/s]

Epoch 100: Loss = 0.6935
Epoch 100: Loss = 0.7186
Epoch 100: Loss = 0.7095
Epoch 100: Loss = 0.7034
Epoch 100: Loss = 0.7141


  1%|          | 112/10000 [00:09<12:25, 13.26it/s]

Epoch 110: Loss = 0.6920
Epoch 110: Loss = 0.6924
Epoch 110: Loss = 0.6661
Epoch 110: Loss = 0.6725
Epoch 110: Loss = 0.7135


  1%|          | 122/10000 [00:09<12:10, 13.52it/s]

Epoch 120: Loss = 0.6703
Epoch 120: Loss = 0.6522
Epoch 120: Loss = 0.6838
Epoch 120: Loss = 0.6654
Epoch 120: Loss = 0.7226


  1%|▏         | 132/10000 [00:10<11:40, 14.08it/s]

Epoch 130: Loss = 0.7057
Epoch 130: Loss = 0.6769
Epoch 130: Loss = 0.7037
Epoch 130: Loss = 0.6861
Epoch 130: Loss = 0.6972


  1%|▏         | 142/10000 [00:11<11:39, 14.09it/s]

Epoch 140: Loss = 0.6996
Epoch 140: Loss = 0.6930
Epoch 140: Loss = 0.6879
Epoch 140: Loss = 0.6730
Epoch 140: Loss = 0.7106


  2%|▏         | 152/10000 [00:12<12:26, 13.19it/s]

Epoch 150: Loss = 0.7098
Epoch 150: Loss = 0.6929
Epoch 150: Loss = 0.7034
Epoch 150: Loss = 0.7244
Epoch 150: Loss = 0.6867


  2%|▏         | 162/10000 [00:12<12:40, 12.94it/s]

Epoch 160: Loss = 0.6824
Epoch 160: Loss = 0.6995
Epoch 160: Loss = 0.7348
Epoch 160: Loss = 0.6735
Epoch 160: Loss = 0.6828


  2%|▏         | 172/10000 [00:13<14:56, 10.97it/s]

Epoch 170: Loss = 0.6733
Epoch 170: Loss = 0.6836
Epoch 170: Loss = 0.6986
Epoch 170: Loss = 0.6692
Epoch 170: Loss = 0.7010


  2%|▏         | 182/10000 [00:14<12:28, 13.12it/s]

Epoch 180: Loss = 0.7022
Epoch 180: Loss = 0.6511
Epoch 180: Loss = 0.6761
Epoch 180: Loss = 0.6988
Epoch 180: Loss = 0.7082


  2%|▏         | 192/10000 [00:15<11:57, 13.68it/s]

Epoch 190: Loss = 0.6818
Epoch 190: Loss = 0.6530
Epoch 190: Loss = 0.6472
Epoch 190: Loss = 0.6787
Epoch 190: Loss = 0.7264


  2%|▏         | 202/10000 [00:16<15:38, 10.44it/s]

Epoch 200: Loss = 0.6550
Epoch 200: Loss = 0.6803
Epoch 200: Loss = 0.6780
Epoch 200: Loss = 0.7202
Epoch 200: Loss = 0.6667


  2%|▏         | 212/10000 [00:17<12:49, 12.73it/s]

Epoch 210: Loss = 0.6762
Epoch 210: Loss = 0.6341
Epoch 210: Loss = 0.6561
Epoch 210: Loss = 0.6930
Epoch 210: Loss = 0.7004


  2%|▏         | 222/10000 [00:17<11:51, 13.75it/s]

Epoch 220: Loss = 0.7028
Epoch 220: Loss = 0.6820
Epoch 220: Loss = 0.6781
Epoch 220: Loss = 0.7110
Epoch 220: Loss = 0.6971


  2%|▏         | 232/10000 [00:18<13:05, 12.44it/s]

Epoch 230: Loss = 0.6877
Epoch 230: Loss = 0.6751
Epoch 230: Loss = 0.6822
Epoch 230: Loss = 0.6628
Epoch 230: Loss = 0.6875


  2%|▏         | 242/10000 [00:19<13:53, 11.71it/s]

Epoch 240: Loss = 0.6992
Epoch 240: Loss = 0.6791
Epoch 240: Loss = 0.7027
Epoch 240: Loss = 0.6915
Epoch 240: Loss = 0.6811


  3%|▎         | 252/10000 [00:20<14:51, 10.93it/s]

Epoch 250: Loss = 0.6875
Epoch 250: Loss = 0.6705
Epoch 250: Loss = 0.6916
Epoch 250: Loss = 0.6907
Epoch 250: Loss = 0.6454


  3%|▎         | 262/10000 [00:21<12:28, 13.01it/s]

Epoch 260: Loss = 0.6971
Epoch 260: Loss = 0.6982
Epoch 260: Loss = 0.6622
Epoch 260: Loss = 0.6768
Epoch 260: Loss = 0.6953


  3%|▎         | 272/10000 [00:21<12:30, 12.96it/s]

Epoch 270: Loss = 0.6910
Epoch 270: Loss = 0.6853
Epoch 270: Loss = 0.7112
Epoch 270: Loss = 0.6953
Epoch 270: Loss = 0.6442


  3%|▎         | 282/10000 [00:22<11:44, 13.79it/s]

Epoch 280: Loss = 0.6639
Epoch 280: Loss = 0.6870
Epoch 280: Loss = 0.6849
Epoch 280: Loss = 0.6866
Epoch 280: Loss = 0.6739


  3%|▎         | 292/10000 [00:23<14:03, 11.51it/s]

Epoch 290: Loss = 0.6888
Epoch 290: Loss = 0.6856
Epoch 290: Loss = 0.6490
Epoch 290: Loss = 0.6985
Epoch 290: Loss = 0.6634


  3%|▎         | 302/10000 [00:24<12:47, 12.64it/s]

Epoch 300: Loss = 0.7124
Epoch 300: Loss = 0.6875
Epoch 300: Loss = 0.7046
Epoch 300: Loss = 0.6874
Epoch 300: Loss = 0.6889


  3%|▎         | 312/10000 [00:25<13:00, 12.42it/s]

Epoch 310: Loss = 0.6783
Epoch 310: Loss = 0.6927
Epoch 310: Loss = 0.6649
Epoch 310: Loss = 0.7255
Epoch 310: Loss = 0.7315


  3%|▎         | 322/10000 [00:25<12:44, 12.67it/s]

Epoch 320: Loss = 0.6769
Epoch 320: Loss = 0.6973
Epoch 320: Loss = 0.6453
Epoch 320: Loss = 0.6967
Epoch 320: Loss = 0.7073


  3%|▎         | 332/10000 [00:26<11:48, 13.65it/s]

Epoch 330: Loss = 0.6585
Epoch 330: Loss = 0.6704
Epoch 330: Loss = 0.6678
Epoch 330: Loss = 0.6908
Epoch 330: Loss = 0.7038


  3%|▎         | 342/10000 [00:27<14:01, 11.47it/s]

Epoch 340: Loss = 0.7119
Epoch 340: Loss = 0.6850
Epoch 340: Loss = 0.6879
Epoch 340: Loss = 0.7031
Epoch 340: Loss = 0.6425


  4%|▎         | 352/10000 [00:28<14:06, 11.40it/s]

Epoch 350: Loss = 0.6854
Epoch 350: Loss = 0.6733
Epoch 350: Loss = 0.6848
Epoch 350: Loss = 0.6810
Epoch 350: Loss = 0.6622


  4%|▎         | 362/10000 [00:29<14:23, 11.16it/s]

Epoch 360: Loss = 0.6608
Epoch 360: Loss = 0.6709
Epoch 360: Loss = 0.6944
Epoch 360: Loss = 0.7047
Epoch 360: Loss = 0.6541


  4%|▎         | 372/10000 [00:30<13:29, 11.89it/s]

Epoch 370: Loss = 0.6939
Epoch 370: Loss = 0.6933
Epoch 370: Loss = 0.6686
Epoch 370: Loss = 0.6722
Epoch 370: Loss = 0.6836


  4%|▍         | 382/10000 [00:31<13:15, 12.09it/s]

Epoch 380: Loss = 0.6711
Epoch 380: Loss = 0.6731
Epoch 380: Loss = 0.6604
Epoch 380: Loss = 0.6826
Epoch 380: Loss = 0.6592


  4%|▍         | 392/10000 [00:31<13:03, 12.26it/s]

Epoch 390: Loss = 0.6653
Epoch 390: Loss = 0.7223
Epoch 390: Loss = 0.6984
Epoch 390: Loss = 0.6786
Epoch 390: Loss = 0.6824


  4%|▍         | 402/10000 [00:32<14:57, 10.70it/s]

Epoch 400: Loss = 0.6891
Epoch 400: Loss = 0.6846
Epoch 400: Loss = 0.6978
Epoch 400: Loss = 0.6650
Epoch 400: Loss = 0.6874


  4%|▍         | 412/10000 [00:33<14:44, 10.84it/s]

Epoch 410: Loss = 0.6809
Epoch 410: Loss = 0.6615
Epoch 410: Loss = 0.6719
Epoch 410: Loss = 0.7134
Epoch 410: Loss = 0.6768


  4%|▍         | 422/10000 [00:34<14:32, 10.98it/s]

Epoch 420: Loss = 0.7039
Epoch 420: Loss = 0.6745
Epoch 420: Loss = 0.6575
Epoch 420: Loss = 0.6680
Epoch 420: Loss = 0.7140


  4%|▍         | 432/10000 [00:35<13:13, 12.06it/s]

Epoch 430: Loss = 0.6889
Epoch 430: Loss = 0.6937
Epoch 430: Loss = 0.6646
Epoch 430: Loss = 0.6422
Epoch 430: Loss = 0.7175


  4%|▍         | 442/10000 [00:36<12:03, 13.22it/s]

Epoch 440: Loss = 0.6989
Epoch 440: Loss = 0.7005
Epoch 440: Loss = 0.6781
Epoch 440: Loss = 0.7104
Epoch 440: Loss = 0.6760


  5%|▍         | 452/10000 [00:36<11:34, 13.74it/s]

Epoch 450: Loss = 0.6599
Epoch 450: Loss = 0.6715
Epoch 450: Loss = 0.6435
Epoch 450: Loss = 0.6922
Epoch 450: Loss = 0.7045


  5%|▍         | 462/10000 [00:37<12:03, 13.18it/s]

Epoch 460: Loss = 0.6821
Epoch 460: Loss = 0.7176
Epoch 460: Loss = 0.6706
Epoch 460: Loss = 0.6616
Epoch 460: Loss = 0.6574


  5%|▍         | 472/10000 [00:38<12:35, 12.62it/s]

Epoch 470: Loss = 0.6589
Epoch 470: Loss = 0.6865
Epoch 470: Loss = 0.6831
Epoch 470: Loss = 0.6797
Epoch 470: Loss = 0.6832


  5%|▍         | 482/10000 [00:39<11:27, 13.85it/s]

Epoch 480: Loss = 0.6923
Epoch 480: Loss = 0.6849
Epoch 480: Loss = 0.6894
Epoch 480: Loss = 0.6798
Epoch 480: Loss = 0.6667


  5%|▍         | 492/10000 [00:40<13:39, 11.61it/s]

Epoch 490: Loss = 0.6610
Epoch 490: Loss = 0.6570
Epoch 490: Loss = 0.6865
Epoch 490: Loss = 0.6871
Epoch 490: Loss = 0.6972


  5%|▌         | 502/10000 [00:40<12:19, 12.84it/s]

Epoch 500: Loss = 0.6552
Epoch 500: Loss = 0.6840
Epoch 500: Loss = 0.7067
Epoch 500: Loss = 0.6681
Epoch 500: Loss = 0.6695


  5%|▌         | 512/10000 [00:41<11:25, 13.84it/s]

Epoch 510: Loss = 0.6556
Epoch 510: Loss = 0.7129
Epoch 510: Loss = 0.6527
Epoch 510: Loss = 0.6912
Epoch 510: Loss = 0.6520


  5%|▌         | 522/10000 [00:42<11:25, 13.83it/s]

Epoch 520: Loss = 0.6799
Epoch 520: Loss = 0.6626
Epoch 520: Loss = 0.6840
Epoch 520: Loss = 0.6867
Epoch 520: Loss = 0.6755


  5%|▌         | 532/10000 [00:43<12:32, 12.58it/s]

Epoch 530: Loss = 0.6842
Epoch 530: Loss = 0.6414
Epoch 530: Loss = 0.6811
Epoch 530: Loss = 0.7014
Epoch 530: Loss = 0.6639


  5%|▌         | 542/10000 [00:43<11:31, 13.67it/s]

Epoch 540: Loss = 0.6953
Epoch 540: Loss = 0.6788
Epoch 540: Loss = 0.7115
Epoch 540: Loss = 0.6780
Epoch 540: Loss = 0.7043


  6%|▌         | 552/10000 [00:44<14:41, 10.72it/s]

Epoch 550: Loss = 0.6845
Epoch 550: Loss = 0.6803
Epoch 550: Loss = 0.6726
Epoch 550: Loss = 0.6463
Epoch 550: Loss = 0.6805


  6%|▌         | 562/10000 [00:45<13:15, 11.87it/s]

Epoch 560: Loss = 0.6846
Epoch 560: Loss = 0.6756
Epoch 560: Loss = 0.7027
Epoch 560: Loss = 0.6619
Epoch 560: Loss = 0.6766


  6%|▌         | 572/10000 [00:46<13:01, 12.07it/s]

Epoch 570: Loss = 0.6638
Epoch 570: Loss = 0.6437
Epoch 570: Loss = 0.6992
Epoch 570: Loss = 0.6786
Epoch 570: Loss = 0.6857


  6%|▌         | 582/10000 [00:47<12:18, 12.75it/s]

Epoch 580: Loss = 0.6898
Epoch 580: Loss = 0.6954
Epoch 580: Loss = 0.6838
Epoch 580: Loss = 0.7049
Epoch 580: Loss = 0.7016


  6%|▌         | 592/10000 [00:48<12:30, 12.54it/s]

Epoch 590: Loss = 0.7039
Epoch 590: Loss = 0.6852
Epoch 590: Loss = 0.6779
Epoch 590: Loss = 0.6542
Epoch 590: Loss = 0.6729


  6%|▌         | 602/10000 [00:48<12:43, 12.31it/s]

Epoch 600: Loss = 0.6737
Epoch 600: Loss = 0.6411
Epoch 600: Loss = 0.6741
Epoch 600: Loss = 0.6734
Epoch 600: Loss = 0.6887


  6%|▌         | 612/10000 [00:49<13:04, 11.96it/s]

Epoch 610: Loss = 0.7195
Epoch 610: Loss = 0.6821
Epoch 610: Loss = 0.6672
Epoch 610: Loss = 0.6839
Epoch 610: Loss = 0.6898


  6%|▌         | 622/10000 [00:50<12:52, 12.14it/s]

Epoch 620: Loss = 0.6798
Epoch 620: Loss = 0.6991
Epoch 620: Loss = 0.6634
Epoch 620: Loss = 0.6886
Epoch 620: Loss = 0.7205


  6%|▋         | 632/10000 [00:51<11:41, 13.35it/s]

Epoch 630: Loss = 0.6476
Epoch 630: Loss = 0.6678
Epoch 630: Loss = 0.6524
Epoch 630: Loss = 0.6893
Epoch 630: Loss = 0.6769


  6%|▋         | 642/10000 [00:52<12:17, 12.69it/s]

Epoch 640: Loss = 0.7037
Epoch 640: Loss = 0.6805
Epoch 640: Loss = 0.6913
Epoch 640: Loss = 0.7029
Epoch 640: Loss = 0.6597


  7%|▋         | 652/10000 [00:53<11:55, 13.06it/s]

Epoch 650: Loss = 0.7082
Epoch 650: Loss = 0.6934
Epoch 650: Loss = 0.6613
Epoch 650: Loss = 0.6818
Epoch 650: Loss = 0.6367


  7%|▋         | 662/10000 [00:53<11:35, 13.43it/s]

Epoch 660: Loss = 0.6858
Epoch 660: Loss = 0.6615
Epoch 660: Loss = 0.6612
Epoch 660: Loss = 0.6777
Epoch 660: Loss = 0.6513


  7%|▋         | 672/10000 [00:54<11:20, 13.72it/s]

Epoch 670: Loss = 0.6513
Epoch 670: Loss = 0.6773
Epoch 670: Loss = 0.7033
Epoch 670: Loss = 0.6694
Epoch 670: Loss = 0.6874


  7%|▋         | 682/10000 [00:55<12:00, 12.94it/s]

Epoch 680: Loss = 0.6511
Epoch 680: Loss = 0.6848
Epoch 680: Loss = 0.6799
Epoch 680: Loss = 0.6486
Epoch 680: Loss = 0.6720


  7%|▋         | 692/10000 [00:56<12:56, 11.99it/s]

Epoch 690: Loss = 0.7121
Epoch 690: Loss = 0.6619
Epoch 690: Loss = 0.6977
Epoch 690: Loss = 0.6909
Epoch 690: Loss = 0.6876


  7%|▋         | 702/10000 [00:56<11:32, 13.43it/s]

Epoch 700: Loss = 0.6766
Epoch 700: Loss = 0.6675
Epoch 700: Loss = 0.6563
Epoch 700: Loss = 0.6702
Epoch 700: Loss = 0.6599


  7%|▋         | 712/10000 [00:57<11:57, 12.94it/s]

Epoch 710: Loss = 0.6503
Epoch 710: Loss = 0.6844
Epoch 710: Loss = 0.6707
Epoch 710: Loss = 0.6929
Epoch 710: Loss = 0.6559


  7%|▋         | 722/10000 [00:58<12:30, 12.37it/s]

Epoch 720: Loss = 0.6920
Epoch 720: Loss = 0.6916
Epoch 720: Loss = 0.6755
Epoch 720: Loss = 0.6787
Epoch 720: Loss = 0.6794


  7%|▋         | 732/10000 [00:59<13:21, 11.56it/s]

Epoch 730: Loss = 0.6652
Epoch 730: Loss = 0.6940
Epoch 730: Loss = 0.6767
Epoch 730: Loss = 0.6513
Epoch 730: Loss = 0.6859


  7%|▋         | 742/10000 [01:00<13:03, 11.81it/s]

Epoch 740: Loss = 0.7035
Epoch 740: Loss = 0.6835
Epoch 740: Loss = 0.6680
Epoch 740: Loss = 0.6877
Epoch 740: Loss = 0.6837


  8%|▊         | 752/10000 [01:01<14:09, 10.89it/s]

Epoch 750: Loss = 0.6707
Epoch 750: Loss = 0.6560
Epoch 750: Loss = 0.6782
Epoch 750: Loss = 0.6553
Epoch 750: Loss = 0.6993


  8%|▊         | 762/10000 [01:01<12:16, 12.54it/s]

Epoch 760: Loss = 0.7028
Epoch 760: Loss = 0.6468
Epoch 760: Loss = 0.6559
Epoch 760: Loss = 0.6782
Epoch 760: Loss = 0.6647


  8%|▊         | 772/10000 [01:02<12:35, 12.21it/s]

Epoch 770: Loss = 0.6797
Epoch 770: Loss = 0.7124
Epoch 770: Loss = 0.6805
Epoch 770: Loss = 0.6960
Epoch 770: Loss = 0.6739


  8%|▊         | 782/10000 [01:03<11:41, 13.15it/s]

Epoch 780: Loss = 0.6782
Epoch 780: Loss = 0.6993
Epoch 780: Loss = 0.6694
Epoch 780: Loss = 0.6765
Epoch 780: Loss = 0.6641


  8%|▊         | 792/10000 [01:04<12:01, 12.76it/s]

Epoch 790: Loss = 0.6730
Epoch 790: Loss = 0.6898
Epoch 790: Loss = 0.6869
Epoch 790: Loss = 0.6713
Epoch 790: Loss = 0.6450


  8%|▊         | 802/10000 [01:05<11:59, 12.78it/s]

Epoch 800: Loss = 0.6605
Epoch 800: Loss = 0.6750
Epoch 800: Loss = 0.6723
Epoch 800: Loss = 0.6826
Epoch 800: Loss = 0.7018


  8%|▊         | 812/10000 [01:05<11:53, 12.88it/s]

Epoch 810: Loss = 0.6480
Epoch 810: Loss = 0.6731
Epoch 810: Loss = 0.6631
Epoch 810: Loss = 0.7023
Epoch 810: Loss = 0.7013


  8%|▊         | 822/10000 [01:06<14:23, 10.63it/s]

Epoch 820: Loss = 0.6790
Epoch 820: Loss = 0.7031
Epoch 820: Loss = 0.6617
Epoch 820: Loss = 0.6948
Epoch 820: Loss = 0.6716


  8%|▊         | 832/10000 [01:07<12:44, 12.00it/s]

Epoch 830: Loss = 0.6433
Epoch 830: Loss = 0.6775
Epoch 830: Loss = 0.6704
Epoch 830: Loss = 0.6751
Epoch 830: Loss = 0.6617


  8%|▊         | 842/10000 [01:08<13:13, 11.54it/s]

Epoch 840: Loss = 0.6864
Epoch 840: Loss = 0.6587
Epoch 840: Loss = 0.6832
Epoch 840: Loss = 0.6799
Epoch 840: Loss = 0.6934


  9%|▊         | 852/10000 [01:09<13:01, 11.70it/s]

Epoch 850: Loss = 0.6898
Epoch 850: Loss = 0.6623
Epoch 850: Loss = 0.6517
Epoch 850: Loss = 0.6770
Epoch 850: Loss = 0.6665


  9%|▊         | 862/10000 [01:10<11:38, 13.08it/s]

Epoch 860: Loss = 0.6475
Epoch 860: Loss = 0.6978
Epoch 860: Loss = 0.6800
Epoch 860: Loss = 0.7011
Epoch 860: Loss = 0.6648


  9%|▊         | 872/10000 [01:11<11:52, 12.81it/s]

Epoch 870: Loss = 0.6684
Epoch 870: Loss = 0.6911
Epoch 870: Loss = 0.6755
Epoch 870: Loss = 0.6651
Epoch 870: Loss = 0.6680


  9%|▉         | 882/10000 [01:11<11:07, 13.67it/s]

Epoch 880: Loss = 0.7101
Epoch 880: Loss = 0.6857
Epoch 880: Loss = 0.6567
Epoch 880: Loss = 0.6561
Epoch 880: Loss = 0.6472


  9%|▉         | 892/10000 [01:12<11:04, 13.72it/s]

Epoch 890: Loss = 0.6545
Epoch 890: Loss = 0.6847
Epoch 890: Loss = 0.6652
Epoch 890: Loss = 0.6734
Epoch 890: Loss = 0.6900


  9%|▉         | 902/10000 [01:13<11:16, 13.44it/s]

Epoch 900: Loss = 0.6694
Epoch 900: Loss = 0.7235
Epoch 900: Loss = 0.6761
Epoch 900: Loss = 0.6966
Epoch 900: Loss = 0.6903


  9%|▉         | 912/10000 [01:13<11:12, 13.52it/s]

Epoch 910: Loss = 0.7013
Epoch 910: Loss = 0.7082
Epoch 910: Loss = 0.6824
Epoch 910: Loss = 0.7055
Epoch 910: Loss = 0.6823


  9%|▉         | 922/10000 [01:14<11:24, 13.26it/s]

Epoch 920: Loss = 0.6854
Epoch 920: Loss = 0.6883
Epoch 920: Loss = 0.6862
Epoch 920: Loss = 0.6936
Epoch 920: Loss = 0.6674


  9%|▉         | 932/10000 [01:15<12:22, 12.21it/s]

Epoch 930: Loss = 0.6690
Epoch 930: Loss = 0.6708
Epoch 930: Loss = 0.6637
Epoch 930: Loss = 0.6877
Epoch 930: Loss = 0.6613


  9%|▉         | 942/10000 [01:16<11:30, 13.11it/s]

Epoch 940: Loss = 0.6999
Epoch 940: Loss = 0.7061
Epoch 940: Loss = 0.6926
Epoch 940: Loss = 0.6848
Epoch 940: Loss = 0.6674


 10%|▉         | 952/10000 [01:17<12:08, 12.42it/s]

Epoch 950: Loss = 0.6881
Epoch 950: Loss = 0.6828
Epoch 950: Loss = 0.7081
Epoch 950: Loss = 0.7043
Epoch 950: Loss = 0.6410


 10%|▉         | 962/10000 [01:18<14:08, 10.65it/s]

Epoch 960: Loss = 0.7019
Epoch 960: Loss = 0.6633
Epoch 960: Loss = 0.6743
Epoch 960: Loss = 0.6843
Epoch 960: Loss = 0.6391


 10%|▉         | 972/10000 [01:19<12:31, 12.01it/s]

Epoch 970: Loss = 0.6767
Epoch 970: Loss = 0.6968
Epoch 970: Loss = 0.6996
Epoch 970: Loss = 0.6442
Epoch 970: Loss = 0.6636


 10%|▉         | 982/10000 [01:19<11:07, 13.50it/s]

Epoch 980: Loss = 0.6734
Epoch 980: Loss = 0.6900
Epoch 980: Loss = 0.6712
Epoch 980: Loss = 0.6860
Epoch 980: Loss = 0.6654


 10%|▉         | 992/10000 [01:20<11:23, 13.19it/s]

Epoch 990: Loss = 0.6486
Epoch 990: Loss = 0.6985
Epoch 990: Loss = 0.7019
Epoch 990: Loss = 0.7030
Epoch 990: Loss = 0.6805


 10%|█         | 1002/10000 [01:21<11:07, 13.49it/s]

Epoch 1000: Loss = 0.6875
Epoch 1000: Loss = 0.7024
Epoch 1000: Loss = 0.6958
Epoch 1000: Loss = 0.6670
Epoch 1000: Loss = 0.6998


 10%|█         | 1012/10000 [01:22<12:14, 12.24it/s]

Epoch 1010: Loss = 0.6706
Epoch 1010: Loss = 0.6662
Epoch 1010: Loss = 0.6849
Epoch 1010: Loss = 0.6599
Epoch 1010: Loss = 0.6787


 10%|█         | 1022/10000 [01:22<12:03, 12.41it/s]

Epoch 1020: Loss = 0.6767
Epoch 1020: Loss = 0.6449
Epoch 1020: Loss = 0.6917
Epoch 1020: Loss = 0.6832
Epoch 1020: Loss = 0.6405


 10%|█         | 1032/10000 [01:23<11:31, 12.96it/s]

Epoch 1030: Loss = 0.6884
Epoch 1030: Loss = 0.6804
Epoch 1030: Loss = 0.6438
Epoch 1030: Loss = 0.7058
Epoch 1030: Loss = 0.6776


 10%|█         | 1042/10000 [01:24<10:51, 13.75it/s]

Epoch 1040: Loss = 0.6415
Epoch 1040: Loss = 0.6573
Epoch 1040: Loss = 0.6524
Epoch 1040: Loss = 0.6816
Epoch 1040: Loss = 0.6880


 11%|█         | 1052/10000 [01:25<11:46, 12.66it/s]

Epoch 1050: Loss = 0.6623
Epoch 1050: Loss = 0.7098
Epoch 1050: Loss = 0.6675
Epoch 1050: Loss = 0.6678
Epoch 1050: Loss = 0.6549


 11%|█         | 1062/10000 [01:26<13:05, 11.38it/s]

Epoch 1060: Loss = 0.6574
Epoch 1060: Loss = 0.6437
Epoch 1060: Loss = 0.6536
Epoch 1060: Loss = 0.6844
Epoch 1060: Loss = 0.7095


 11%|█         | 1072/10000 [01:27<12:25, 11.98it/s]

Epoch 1070: Loss = 0.6742
Epoch 1070: Loss = 0.6761
Epoch 1070: Loss = 0.6654
Epoch 1070: Loss = 0.6797
Epoch 1070: Loss = 0.6744


 11%|█         | 1082/10000 [01:27<10:53, 13.64it/s]

Epoch 1080: Loss = 0.7476
Epoch 1080: Loss = 0.6711
Epoch 1080: Loss = 0.6977
Epoch 1080: Loss = 0.6876
Epoch 1080: Loss = 0.6733


 11%|█         | 1092/10000 [01:28<11:07, 13.34it/s]

Epoch 1090: Loss = 0.6999
Epoch 1090: Loss = 0.6884
Epoch 1090: Loss = 0.6735
Epoch 1090: Loss = 0.6597
Epoch 1090: Loss = 0.7026


 11%|█         | 1102/10000 [01:29<12:09, 12.20it/s]

Epoch 1100: Loss = 0.6757
Epoch 1100: Loss = 0.6874
Epoch 1100: Loss = 0.6335
Epoch 1100: Loss = 0.7100
Epoch 1100: Loss = 0.6656


 11%|█         | 1112/10000 [01:30<11:48, 12.55it/s]

Epoch 1110: Loss = 0.6382
Epoch 1110: Loss = 0.6881
Epoch 1110: Loss = 0.6715
Epoch 1110: Loss = 0.6777
Epoch 1110: Loss = 0.7092


 11%|█         | 1122/10000 [01:31<11:38, 12.71it/s]

Epoch 1120: Loss = 0.7077
Epoch 1120: Loss = 0.6593
Epoch 1120: Loss = 0.6697
Epoch 1120: Loss = 0.6805
Epoch 1120: Loss = 0.6514


 11%|█▏        | 1132/10000 [01:31<10:53, 13.57it/s]

Epoch 1130: Loss = 0.6877
Epoch 1130: Loss = 0.6580
Epoch 1130: Loss = 0.6874
Epoch 1130: Loss = 0.6428
Epoch 1130: Loss = 0.6724


 11%|█▏        | 1142/10000 [01:32<10:40, 13.83it/s]

Epoch 1140: Loss = 0.6860
Epoch 1140: Loss = 0.6553
Epoch 1140: Loss = 0.6909
Epoch 1140: Loss = 0.6877
Epoch 1140: Loss = 0.7083


 12%|█▏        | 1152/10000 [01:33<11:40, 12.63it/s]

Epoch 1150: Loss = 0.6962
Epoch 1150: Loss = 0.6610
Epoch 1150: Loss = 0.6592
Epoch 1150: Loss = 0.6905
Epoch 1150: Loss = 0.6520


 12%|█▏        | 1162/10000 [01:34<10:59, 13.40it/s]

Epoch 1160: Loss = 0.6795
Epoch 1160: Loss = 0.6708
Epoch 1160: Loss = 0.6906
Epoch 1160: Loss = 0.6449
Epoch 1160: Loss = 0.6917


 12%|█▏        | 1172/10000 [01:34<12:40, 11.60it/s]

Epoch 1170: Loss = 0.6799
Epoch 1170: Loss = 0.6775
Epoch 1170: Loss = 0.6573
Epoch 1170: Loss = 0.6806
Epoch 1170: Loss = 0.7120


 12%|█▏        | 1182/10000 [01:35<11:34, 12.71it/s]

Epoch 1180: Loss = 0.6652
Epoch 1180: Loss = 0.6674
Epoch 1180: Loss = 0.6871
Epoch 1180: Loss = 0.6621
Epoch 1180: Loss = 0.6800


 12%|█▏        | 1192/10000 [01:36<11:17, 13.00it/s]

Epoch 1190: Loss = 0.6746
Epoch 1190: Loss = 0.6688
Epoch 1190: Loss = 0.6687
Epoch 1190: Loss = 0.6735
Epoch 1190: Loss = 0.6783


 12%|█▏        | 1202/10000 [01:37<11:20, 12.92it/s]

Epoch 1200: Loss = 0.7092
Epoch 1200: Loss = 0.6718
Epoch 1200: Loss = 0.6593
Epoch 1200: Loss = 0.6713
Epoch 1200: Loss = 0.6635


 12%|█▏        | 1212/10000 [01:38<11:33, 12.67it/s]

Epoch 1210: Loss = 0.6705
Epoch 1210: Loss = 0.7295
Epoch 1210: Loss = 0.6371
Epoch 1210: Loss = 0.6683
Epoch 1210: Loss = 0.7134


 12%|█▏        | 1222/10000 [01:38<11:07, 13.15it/s]

Epoch 1220: Loss = 0.6722
Epoch 1220: Loss = 0.6675
Epoch 1220: Loss = 0.6861
Epoch 1220: Loss = 0.6695
Epoch 1220: Loss = 0.6682


 12%|█▏        | 1232/10000 [01:39<12:30, 11.68it/s]

Epoch 1230: Loss = 0.6485
Epoch 1230: Loss = 0.6540
Epoch 1230: Loss = 0.7112
Epoch 1230: Loss = 0.6709
Epoch 1230: Loss = 0.6649


 12%|█▏        | 1242/10000 [01:40<11:26, 12.76it/s]

Epoch 1240: Loss = 0.6862
Epoch 1240: Loss = 0.6681
Epoch 1240: Loss = 0.6483
Epoch 1240: Loss = 0.6518
Epoch 1240: Loss = 0.6513


 13%|█▎        | 1252/10000 [01:41<12:53, 11.31it/s]

Epoch 1250: Loss = 0.6849
Epoch 1250: Loss = 0.6998
Epoch 1250: Loss = 0.6792
Epoch 1250: Loss = 0.6589
Epoch 1250: Loss = 0.7247


 13%|█▎        | 1262/10000 [01:42<12:04, 12.06it/s]

Epoch 1260: Loss = 0.6619
Epoch 1260: Loss = 0.6882
Epoch 1260: Loss = 0.6683
Epoch 1260: Loss = 0.6419
Epoch 1260: Loss = 0.6722


 13%|█▎        | 1272/10000 [01:43<11:50, 12.28it/s]

Epoch 1270: Loss = 0.6821
Epoch 1270: Loss = 0.6462
Epoch 1270: Loss = 0.6881
Epoch 1270: Loss = 0.6535
Epoch 1270: Loss = 0.6755


 13%|█▎        | 1282/10000 [01:43<10:49, 13.42it/s]

Epoch 1280: Loss = 0.7012
Epoch 1280: Loss = 0.6962
Epoch 1280: Loss = 0.7196
Epoch 1280: Loss = 0.6815
Epoch 1280: Loss = 0.6888


 13%|█▎        | 1292/10000 [01:44<10:40, 13.59it/s]

Epoch 1290: Loss = 0.6769
Epoch 1290: Loss = 0.6514
Epoch 1290: Loss = 0.6437
Epoch 1290: Loss = 0.6350
Epoch 1290: Loss = 0.6400


 13%|█▎        | 1302/10000 [01:45<12:48, 11.31it/s]

Epoch 1300: Loss = 0.6583
Epoch 1300: Loss = 0.6657
Epoch 1300: Loss = 0.6668
Epoch 1300: Loss = 0.6487
Epoch 1300: Loss = 0.6614


 13%|█▎        | 1312/10000 [01:46<12:38, 11.46it/s]

Epoch 1310: Loss = 0.6802
Epoch 1310: Loss = 0.7096
Epoch 1310: Loss = 0.6989
Epoch 1310: Loss = 0.6719
Epoch 1310: Loss = 0.6770


 13%|█▎        | 1322/10000 [01:47<12:19, 11.73it/s]

Epoch 1320: Loss = 0.6800
Epoch 1320: Loss = 0.6858
Epoch 1320: Loss = 0.6832
Epoch 1320: Loss = 0.6899
Epoch 1320: Loss = 0.6588


 13%|█▎        | 1332/10000 [01:48<12:39, 11.41it/s]

Epoch 1330: Loss = 0.6689
Epoch 1330: Loss = 0.6481
Epoch 1330: Loss = 0.6988
Epoch 1330: Loss = 0.6851
Epoch 1330: Loss = 0.6632


 13%|█▎        | 1342/10000 [01:49<12:17, 11.74it/s]

Epoch 1340: Loss = 0.6667
Epoch 1340: Loss = 0.6847
Epoch 1340: Loss = 0.6861
Epoch 1340: Loss = 0.6598
Epoch 1340: Loss = 0.6553


 14%|█▎        | 1352/10000 [01:50<12:50, 11.22it/s]

Epoch 1350: Loss = 0.6886
Epoch 1350: Loss = 0.6280
Epoch 1350: Loss = 0.6372
Epoch 1350: Loss = 0.7037
Epoch 1350: Loss = 0.6584


 14%|█▎        | 1362/10000 [01:50<10:59, 13.10it/s]

Epoch 1360: Loss = 0.6788
Epoch 1360: Loss = 0.6761
Epoch 1360: Loss = 0.6337
Epoch 1360: Loss = 0.6486
Epoch 1360: Loss = 0.6413


 14%|█▎        | 1372/10000 [01:51<11:34, 12.42it/s]

Epoch 1370: Loss = 0.6626
Epoch 1370: Loss = 0.6789
Epoch 1370: Loss = 0.6772
Epoch 1370: Loss = 0.6956
Epoch 1370: Loss = 0.6672


 14%|█▍        | 1382/10000 [01:52<11:40, 12.30it/s]

Epoch 1380: Loss = 0.6788
Epoch 1380: Loss = 0.6746
Epoch 1380: Loss = 0.6456
Epoch 1380: Loss = 0.6839
Epoch 1380: Loss = 0.6495


 14%|█▍        | 1392/10000 [01:53<11:38, 12.32it/s]

Epoch 1390: Loss = 0.6839
Epoch 1390: Loss = 0.6840
Epoch 1390: Loss = 0.6558
Epoch 1390: Loss = 0.6633
Epoch 1390: Loss = 0.6702


 14%|█▍        | 1402/10000 [01:54<11:16, 12.70it/s]

Epoch 1400: Loss = 0.7025
Epoch 1400: Loss = 0.6755
Epoch 1400: Loss = 0.6515
Epoch 1400: Loss = 0.6769
Epoch 1400: Loss = 0.6738


 14%|█▍        | 1412/10000 [01:54<12:41, 11.27it/s]

Epoch 1410: Loss = 0.7141
Epoch 1410: Loss = 0.6518
Epoch 1410: Loss = 0.6992
Epoch 1410: Loss = 0.6746
Epoch 1410: Loss = 0.6911


 14%|█▍        | 1422/10000 [01:55<11:23, 12.56it/s]

Epoch 1420: Loss = 0.6635
Epoch 1420: Loss = 0.6714
Epoch 1420: Loss = 0.6744
Epoch 1420: Loss = 0.6852
Epoch 1420: Loss = 0.6929


 14%|█▍        | 1432/10000 [01:56<10:49, 13.19it/s]

Epoch 1430: Loss = 0.6630
Epoch 1430: Loss = 0.6274
Epoch 1430: Loss = 0.6792
Epoch 1430: Loss = 0.6641
Epoch 1430: Loss = 0.6337


 14%|█▍        | 1442/10000 [01:57<12:49, 11.12it/s]

Epoch 1440: Loss = 0.6678
Epoch 1440: Loss = 0.6569
Epoch 1440: Loss = 0.6400
Epoch 1440: Loss = 0.6837
Epoch 1440: Loss = 0.6372


 15%|█▍        | 1452/10000 [01:58<11:47, 12.08it/s]

Epoch 1450: Loss = 0.6623
Epoch 1450: Loss = 0.7006
Epoch 1450: Loss = 0.6535
Epoch 1450: Loss = 0.6684
Epoch 1450: Loss = 0.6528


 15%|█▍        | 1462/10000 [01:59<11:21, 12.53it/s]

Epoch 1460: Loss = 0.7048
Epoch 1460: Loss = 0.6571
Epoch 1460: Loss = 0.6841
Epoch 1460: Loss = 0.6642
Epoch 1460: Loss = 0.6634


 15%|█▍        | 1472/10000 [01:59<10:41, 13.30it/s]

Epoch 1470: Loss = 0.6441
Epoch 1470: Loss = 0.6715
Epoch 1470: Loss = 0.7042
Epoch 1470: Loss = 0.6656
Epoch 1470: Loss = 0.7039


 15%|█▍        | 1482/10000 [02:00<10:21, 13.70it/s]

Epoch 1480: Loss = 0.6744
Epoch 1480: Loss = 0.6669
Epoch 1480: Loss = 0.7109
Epoch 1480: Loss = 0.6672
Epoch 1480: Loss = 0.6939


 15%|█▍        | 1492/10000 [02:01<11:12, 12.65it/s]

Epoch 1490: Loss = 0.7107
Epoch 1490: Loss = 0.6514
Epoch 1490: Loss = 0.6797
Epoch 1490: Loss = 0.6314
Epoch 1490: Loss = 0.6703


 15%|█▌        | 1502/10000 [02:02<10:26, 13.57it/s]

Epoch 1500: Loss = 0.6917
Epoch 1500: Loss = 0.6482
Epoch 1500: Loss = 0.6815
Epoch 1500: Loss = 0.7044
Epoch 1500: Loss = 0.6624


 15%|█▌        | 1512/10000 [02:03<11:17, 12.53it/s]

Epoch 1510: Loss = 0.6979
Epoch 1510: Loss = 0.6847
Epoch 1510: Loss = 0.6461
Epoch 1510: Loss = 0.6710
Epoch 1510: Loss = 0.6771


 15%|█▌        | 1522/10000 [02:03<11:31, 12.26it/s]

Epoch 1520: Loss = 0.6734
Epoch 1520: Loss = 0.6545
Epoch 1520: Loss = 0.6489
Epoch 1520: Loss = 0.6883
Epoch 1520: Loss = 0.6498


 15%|█▌        | 1532/10000 [02:04<12:22, 11.40it/s]

Epoch 1530: Loss = 0.7239
Epoch 1530: Loss = 0.7167
Epoch 1530: Loss = 0.6878
Epoch 1530: Loss = 0.6800
Epoch 1530: Loss = 0.6964


 15%|█▌        | 1542/10000 [02:05<11:59, 11.76it/s]

Epoch 1540: Loss = 0.6543
Epoch 1540: Loss = 0.6802
Epoch 1540: Loss = 0.7026
Epoch 1540: Loss = 0.6574
Epoch 1540: Loss = 0.6549


 16%|█▌        | 1552/10000 [02:06<10:38, 13.24it/s]

Epoch 1550: Loss = 0.6470
Epoch 1550: Loss = 0.6520
Epoch 1550: Loss = 0.6888
Epoch 1550: Loss = 0.6586
Epoch 1550: Loss = 0.6621


 16%|█▌        | 1562/10000 [02:07<10:53, 12.92it/s]

Epoch 1560: Loss = 0.6975
Epoch 1560: Loss = 0.6664
Epoch 1560: Loss = 0.6909
Epoch 1560: Loss = 0.6568
Epoch 1560: Loss = 0.6935


 16%|█▌        | 1572/10000 [02:08<12:47, 10.97it/s]

Epoch 1570: Loss = 0.6726
Epoch 1570: Loss = 0.6708
Epoch 1570: Loss = 0.6678
Epoch 1570: Loss = 0.6718
Epoch 1570: Loss = 0.6710


 16%|█▌        | 1582/10000 [02:09<13:12, 10.63it/s]

Epoch 1580: Loss = 0.6855
Epoch 1580: Loss = 0.6616
Epoch 1580: Loss = 0.6582
Epoch 1580: Loss = 0.6649
Epoch 1580: Loss = 0.6792


 16%|█▌        | 1592/10000 [02:10<12:29, 11.22it/s]

Epoch 1590: Loss = 0.6827
Epoch 1590: Loss = 0.7027
Epoch 1590: Loss = 0.6880
Epoch 1590: Loss = 0.7061
Epoch 1590: Loss = 0.6994


 16%|█▌        | 1602/10000 [02:10<10:47, 12.96it/s]

Epoch 1600: Loss = 0.6814
Epoch 1600: Loss = 0.6668
Epoch 1600: Loss = 0.6847
Epoch 1600: Loss = 0.6831
Epoch 1600: Loss = 0.6885


 16%|█▌        | 1612/10000 [02:11<10:31, 13.29it/s]

Epoch 1610: Loss = 0.6971
Epoch 1610: Loss = 0.6678
Epoch 1610: Loss = 0.6419
Epoch 1610: Loss = 0.6351
Epoch 1610: Loss = 0.6566


 16%|█▌        | 1622/10000 [02:12<11:11, 12.48it/s]

Epoch 1620: Loss = 0.6711
Epoch 1620: Loss = 0.6701
Epoch 1620: Loss = 0.6584
Epoch 1620: Loss = 0.6594
Epoch 1620: Loss = 0.6709


 16%|█▋        | 1632/10000 [02:13<12:45, 10.93it/s]

Epoch 1630: Loss = 0.6965
Epoch 1630: Loss = 0.6681
Epoch 1630: Loss = 0.6932
Epoch 1630: Loss = 0.6850
Epoch 1630: Loss = 0.6851


 16%|█▋        | 1640/10000 [02:14<12:50, 10.84it/s]

Epoch 1640: Loss = 0.7068
Epoch 1640: Loss = 0.6869
Epoch 1640: Loss = 0.6604
Epoch 1640: Loss = 0.6653
Epoch 1640: Loss = 0.6445


 17%|█▋        | 1652/10000 [02:15<11:44, 11.85it/s]

Epoch 1650: Loss = 0.6726
Epoch 1650: Loss = 0.6617
Epoch 1650: Loss = 0.6738
Epoch 1650: Loss = 0.7140
Epoch 1650: Loss = 0.6651


 17%|█▋        | 1662/10000 [02:16<11:19, 12.28it/s]

Epoch 1660: Loss = 0.6970
Epoch 1660: Loss = 0.6531
Epoch 1660: Loss = 0.6895
Epoch 1660: Loss = 0.6630
Epoch 1660: Loss = 0.6893


 17%|█▋        | 1672/10000 [02:16<10:26, 13.30it/s]

Epoch 1670: Loss = 0.6671
Epoch 1670: Loss = 0.6618
Epoch 1670: Loss = 0.6625
Epoch 1670: Loss = 0.6850
Epoch 1670: Loss = 0.6559


 17%|█▋        | 1682/10000 [02:17<10:27, 13.26it/s]

Epoch 1680: Loss = 0.6645
Epoch 1680: Loss = 0.6732
Epoch 1680: Loss = 0.7013
Epoch 1680: Loss = 0.6415
Epoch 1680: Loss = 0.6892


 17%|█▋        | 1692/10000 [02:18<11:15, 12.30it/s]

Epoch 1690: Loss = 0.6562
Epoch 1690: Loss = 0.6877
Epoch 1690: Loss = 0.6522
Epoch 1690: Loss = 0.6482
Epoch 1690: Loss = 0.6972


 17%|█▋        | 1702/10000 [02:19<10:28, 13.20it/s]

Epoch 1700: Loss = 0.6826
Epoch 1700: Loss = 0.6824
Epoch 1700: Loss = 0.6884
Epoch 1700: Loss = 0.6754
Epoch 1700: Loss = 0.6758


 17%|█▋        | 1712/10000 [02:20<11:30, 12.01it/s]

Epoch 1710: Loss = 0.6957
Epoch 1710: Loss = 0.6845
Epoch 1710: Loss = 0.7024
Epoch 1710: Loss = 0.6815
Epoch 1710: Loss = 0.6572


 17%|█▋        | 1722/10000 [02:20<11:27, 12.05it/s]

Epoch 1720: Loss = 0.6817
Epoch 1720: Loss = 0.6537
Epoch 1720: Loss = 0.7048
Epoch 1720: Loss = 0.6752
Epoch 1720: Loss = 0.6679


 17%|█▋        | 1732/10000 [02:21<11:11, 12.31it/s]

Epoch 1730: Loss = 0.6912
Epoch 1730: Loss = 0.6652
Epoch 1730: Loss = 0.6511
Epoch 1730: Loss = 0.6813
Epoch 1730: Loss = 0.6569


 17%|█▋        | 1742/10000 [02:22<11:33, 11.90it/s]

Epoch 1740: Loss = 0.6572
Epoch 1740: Loss = 0.6470
Epoch 1740: Loss = 0.6641
Epoch 1740: Loss = 0.6700
Epoch 1740: Loss = 0.6643


 18%|█▊        | 1752/10000 [02:23<11:11, 12.28it/s]

Epoch 1750: Loss = 0.6908
Epoch 1750: Loss = 0.6775
Epoch 1750: Loss = 0.6832
Epoch 1750: Loss = 0.6694
Epoch 1750: Loss = 0.6284


 18%|█▊        | 1762/10000 [02:24<11:11, 12.27it/s]

Epoch 1760: Loss = 0.6422
Epoch 1760: Loss = 0.6614
Epoch 1760: Loss = 0.6790
Epoch 1760: Loss = 0.6748
Epoch 1760: Loss = 0.6952


 18%|█▊        | 1772/10000 [02:25<12:30, 10.96it/s]

Epoch 1770: Loss = 0.6447
Epoch 1770: Loss = 0.6620
Epoch 1770: Loss = 0.6747
Epoch 1770: Loss = 0.6768
Epoch 1770: Loss = 0.6878


 18%|█▊        | 1782/10000 [02:25<11:29, 11.92it/s]

Epoch 1780: Loss = 0.6570
Epoch 1780: Loss = 0.6635
Epoch 1780: Loss = 0.7006
Epoch 1780: Loss = 0.6920
Epoch 1780: Loss = 0.6698


 18%|█▊        | 1792/10000 [02:26<10:30, 13.02it/s]

Epoch 1790: Loss = 0.6566
Epoch 1790: Loss = 0.6953
Epoch 1790: Loss = 0.6869
Epoch 1790: Loss = 0.7141
Epoch 1790: Loss = 0.6758


 18%|█▊        | 1802/10000 [02:27<10:43, 12.73it/s]

Epoch 1800: Loss = 0.6525
Epoch 1800: Loss = 0.6998
Epoch 1800: Loss = 0.6755
Epoch 1800: Loss = 0.6888
Epoch 1800: Loss = 0.7106


 18%|█▊        | 1812/10000 [02:28<10:28, 13.03it/s]

Epoch 1810: Loss = 0.6587
Epoch 1810: Loss = 0.6770
Epoch 1810: Loss = 0.6918
Epoch 1810: Loss = 0.6564
Epoch 1810: Loss = 0.6849


 18%|█▊        | 1822/10000 [02:29<12:26, 10.95it/s]

Epoch 1820: Loss = 0.6564
Epoch 1820: Loss = 0.6752
Epoch 1820: Loss = 0.6956
Epoch 1820: Loss = 0.6697
Epoch 1820: Loss = 0.6615


 18%|█▊        | 1832/10000 [02:30<10:30, 12.96it/s]

Epoch 1830: Loss = 0.6596
Epoch 1830: Loss = 0.6263
Epoch 1830: Loss = 0.6809
Epoch 1830: Loss = 0.6570
Epoch 1830: Loss = 0.6705


 18%|█▊        | 1842/10000 [02:30<11:32, 11.78it/s]

Epoch 1840: Loss = 0.6501
Epoch 1840: Loss = 0.6513
Epoch 1840: Loss = 0.6914
Epoch 1840: Loss = 0.7072
Epoch 1840: Loss = 0.6519


 19%|█▊        | 1852/10000 [02:31<10:21, 13.12it/s]

Epoch 1850: Loss = 0.6657
Epoch 1850: Loss = 0.6880
Epoch 1850: Loss = 0.6436
Epoch 1850: Loss = 0.6606
Epoch 1850: Loss = 0.7009


 19%|█▊        | 1862/10000 [02:32<10:37, 12.76it/s]

Epoch 1860: Loss = 0.6435
Epoch 1860: Loss = 0.6720
Epoch 1860: Loss = 0.6661
Epoch 1860: Loss = 0.6730
Epoch 1860: Loss = 0.7028


 19%|█▊        | 1872/10000 [02:33<10:11, 13.28it/s]

Epoch 1870: Loss = 0.6755
Epoch 1870: Loss = 0.6847
Epoch 1870: Loss = 0.7172
Epoch 1870: Loss = 0.6534
Epoch 1870: Loss = 0.6573


 19%|█▉        | 1882/10000 [02:34<10:59, 12.32it/s]

Epoch 1880: Loss = 0.6785
Epoch 1880: Loss = 0.6941
Epoch 1880: Loss = 0.7044
Epoch 1880: Loss = 0.6478
Epoch 1880: Loss = 0.7230


 19%|█▉        | 1892/10000 [02:34<10:20, 13.06it/s]

Epoch 1890: Loss = 0.6464
Epoch 1890: Loss = 0.6757
Epoch 1890: Loss = 0.6493
Epoch 1890: Loss = 0.6918
Epoch 1890: Loss = 0.6656


 19%|█▉        | 1902/10000 [02:35<10:07, 13.33it/s]

Epoch 1900: Loss = 0.6730
Epoch 1900: Loss = 0.7042
Epoch 1900: Loss = 0.6695
Epoch 1900: Loss = 0.6837
Epoch 1900: Loss = 0.6710


 19%|█▉        | 1912/10000 [02:36<10:26, 12.90it/s]

Epoch 1910: Loss = 0.7187
Epoch 1910: Loss = 0.6593
Epoch 1910: Loss = 0.6658
Epoch 1910: Loss = 0.6744
Epoch 1910: Loss = 0.6712


 19%|█▉        | 1922/10000 [02:37<10:33, 12.76it/s]

Epoch 1920: Loss = 0.6354
Epoch 1920: Loss = 0.6656
Epoch 1920: Loss = 0.6963
Epoch 1920: Loss = 0.6672
Epoch 1920: Loss = 0.6695


 19%|█▉        | 1932/10000 [02:38<11:00, 12.21it/s]

Epoch 1930: Loss = 0.6869
Epoch 1930: Loss = 0.6917
Epoch 1930: Loss = 0.6918
Epoch 1930: Loss = 0.6601
Epoch 1930: Loss = 0.6713


 19%|█▉        | 1942/10000 [02:38<11:35, 11.58it/s]

Epoch 1940: Loss = 0.6699
Epoch 1940: Loss = 0.6957
Epoch 1940: Loss = 0.6770
Epoch 1940: Loss = 0.6729
Epoch 1940: Loss = 0.6751


 20%|█▉        | 1952/10000 [02:39<10:07, 13.25it/s]

Epoch 1950: Loss = 0.6686
Epoch 1950: Loss = 0.6726
Epoch 1950: Loss = 0.6822
Epoch 1950: Loss = 0.6761
Epoch 1950: Loss = 0.6673


 20%|█▉        | 1962/10000 [02:40<10:06, 13.25it/s]

Epoch 1960: Loss = 0.6951
Epoch 1960: Loss = 0.6771
Epoch 1960: Loss = 0.6790
Epoch 1960: Loss = 0.6598
Epoch 1960: Loss = 0.6689


 20%|█▉        | 1972/10000 [02:41<11:48, 11.34it/s]

Epoch 1970: Loss = 0.6728
Epoch 1970: Loss = 0.6694
Epoch 1970: Loss = 0.6644
Epoch 1970: Loss = 0.7159
Epoch 1970: Loss = 0.6637


 20%|█▉        | 1982/10000 [02:42<10:46, 12.40it/s]

Epoch 1980: Loss = 0.7137
Epoch 1980: Loss = 0.6868
Epoch 1980: Loss = 0.6605
Epoch 1980: Loss = 0.6954
Epoch 1980: Loss = 0.6516


 20%|█▉        | 1992/10000 [02:43<11:28, 11.62it/s]

Epoch 1990: Loss = 0.6938
Epoch 1990: Loss = 0.6440
Epoch 1990: Loss = 0.6958
Epoch 1990: Loss = 0.6714
Epoch 1990: Loss = 0.6958


 20%|██        | 2002/10000 [02:43<10:18, 12.94it/s]

Epoch 2000: Loss = 0.6539
Epoch 2000: Loss = 0.6753
Epoch 2000: Loss = 0.6598
Epoch 2000: Loss = 0.6658
Epoch 2000: Loss = 0.6725


 20%|██        | 2012/10000 [02:44<11:44, 11.34it/s]

Epoch 2010: Loss = 0.6667
Epoch 2010: Loss = 0.6468
Epoch 2010: Loss = 0.6959
Epoch 2010: Loss = 0.6499
Epoch 2010: Loss = 0.6612


 20%|██        | 2022/10000 [02:45<11:31, 11.53it/s]

Epoch 2020: Loss = 0.6561
Epoch 2020: Loss = 0.6998
Epoch 2020: Loss = 0.6532
Epoch 2020: Loss = 0.6452
Epoch 2020: Loss = 0.6804


 20%|██        | 2032/10000 [02:46<10:43, 12.38it/s]

Epoch 2030: Loss = 0.6742
Epoch 2030: Loss = 0.6791
Epoch 2030: Loss = 0.6702
Epoch 2030: Loss = 0.6534
Epoch 2030: Loss = 0.6738


 20%|██        | 2042/10000 [02:47<09:58, 13.29it/s]

Epoch 2040: Loss = 0.7073
Epoch 2040: Loss = 0.6799
Epoch 2040: Loss = 0.6654
Epoch 2040: Loss = 0.6969
Epoch 2040: Loss = 0.6991


 21%|██        | 2052/10000 [02:48<11:20, 11.68it/s]

Epoch 2050: Loss = 0.6700
Epoch 2050: Loss = 0.6617
Epoch 2050: Loss = 0.6290
Epoch 2050: Loss = 0.6730
Epoch 2050: Loss = 0.6880


 21%|██        | 2062/10000 [02:48<10:20, 12.79it/s]

Epoch 2060: Loss = 0.6722
Epoch 2060: Loss = 0.6942
Epoch 2060: Loss = 0.6939
Epoch 2060: Loss = 0.6795
Epoch 2060: Loss = 0.6859


 21%|██        | 2072/10000 [02:49<10:28, 12.61it/s]

Epoch 2070: Loss = 0.7213
Epoch 2070: Loss = 0.6640
Epoch 2070: Loss = 0.6800
Epoch 2070: Loss = 0.6682
Epoch 2070: Loss = 0.6700


 21%|██        | 2082/10000 [02:50<09:45, 13.52it/s]

Epoch 2080: Loss = 0.6750
Epoch 2080: Loss = 0.6795
Epoch 2080: Loss = 0.7102
Epoch 2080: Loss = 0.6808
Epoch 2080: Loss = 0.6592


 21%|██        | 2092/10000 [02:51<10:31, 12.52it/s]

Epoch 2090: Loss = 0.6947
Epoch 2090: Loss = 0.6626
Epoch 2090: Loss = 0.6485
Epoch 2090: Loss = 0.6675
Epoch 2090: Loss = 0.6434


 21%|██        | 2102/10000 [02:52<11:04, 11.89it/s]

Epoch 2100: Loss = 0.6617
Epoch 2100: Loss = 0.6456
Epoch 2100: Loss = 0.6916
Epoch 2100: Loss = 0.6088
Epoch 2100: Loss = 0.6593


 21%|██        | 2112/10000 [02:52<09:52, 13.32it/s]

Epoch 2110: Loss = 0.6897
Epoch 2110: Loss = 0.7018
Epoch 2110: Loss = 0.6699
Epoch 2110: Loss = 0.6856
Epoch 2110: Loss = 0.6597


 21%|██        | 2120/10000 [02:53<10:20, 12.70it/s]

Epoch 2120: Loss = 0.6670
Epoch 2120: Loss = 0.6993
Epoch 2120: Loss = 0.6695
Epoch 2120: Loss = 0.6727
Epoch 2120: Loss = 0.6453


 21%|██▏       | 2132/10000 [02:54<10:14, 12.81it/s]

Epoch 2130: Loss = 0.6756
Epoch 2130: Loss = 0.6924
Epoch 2130: Loss = 0.6900
Epoch 2130: Loss = 0.7082
Epoch 2130: Loss = 0.6624


 21%|██▏       | 2142/10000 [02:55<10:23, 12.60it/s]

Epoch 2140: Loss = 0.6528
Epoch 2140: Loss = 0.6978
Epoch 2140: Loss = 0.6747
Epoch 2140: Loss = 0.6945
Epoch 2140: Loss = 0.6707


 22%|██▏       | 2152/10000 [02:56<10:02, 13.03it/s]

Epoch 2150: Loss = 0.6902
Epoch 2150: Loss = 0.6829
Epoch 2150: Loss = 0.6667
Epoch 2150: Loss = 0.6603
Epoch 2150: Loss = 0.7007


 22%|██▏       | 2162/10000 [02:56<10:09, 12.85it/s]

Epoch 2160: Loss = 0.6672
Epoch 2160: Loss = 0.6543
Epoch 2160: Loss = 0.6994
Epoch 2160: Loss = 0.6870
Epoch 2160: Loss = 0.6832


 22%|██▏       | 2172/10000 [02:57<12:18, 10.60it/s]

Epoch 2170: Loss = 0.6675
Epoch 2170: Loss = 0.6979
Epoch 2170: Loss = 0.6470
Epoch 2170: Loss = 0.6649
Epoch 2170: Loss = 0.6562


 22%|██▏       | 2182/10000 [02:58<09:58, 13.06it/s]

Epoch 2180: Loss = 0.6692
Epoch 2180: Loss = 0.6666
Epoch 2180: Loss = 0.6725
Epoch 2180: Loss = 0.6849
Epoch 2180: Loss = 0.6663


 22%|██▏       | 2190/10000 [02:59<11:02, 11.80it/s]

Epoch 2190: Loss = 0.6538
Epoch 2190: Loss = 0.6686
Epoch 2190: Loss = 0.6840
Epoch 2190: Loss = 0.6613
Epoch 2190: Loss = 0.6808


 22%|██▏       | 2202/10000 [03:00<11:05, 11.71it/s]

Epoch 2200: Loss = 0.6556
Epoch 2200: Loss = 0.6764
Epoch 2200: Loss = 0.6740
Epoch 2200: Loss = 0.6599
Epoch 2200: Loss = 0.6757


 22%|██▏       | 2212/10000 [03:01<11:52, 10.93it/s]

Epoch 2210: Loss = 0.6731
Epoch 2210: Loss = 0.6639
Epoch 2210: Loss = 0.6554
Epoch 2210: Loss = 0.6739
Epoch 2210: Loss = 0.6997


 22%|██▏       | 2222/10000 [03:02<12:18, 10.53it/s]

Epoch 2220: Loss = 0.6859
Epoch 2220: Loss = 0.6610
Epoch 2220: Loss = 0.6980
Epoch 2220: Loss = 0.7044
Epoch 2220: Loss = 0.6660


 22%|██▏       | 2232/10000 [03:03<12:16, 10.54it/s]

Epoch 2230: Loss = 0.6841
Epoch 2230: Loss = 0.6824
Epoch 2230: Loss = 0.6649
Epoch 2230: Loss = 0.6746
Epoch 2230: Loss = 0.6912


 22%|██▏       | 2242/10000 [03:04<10:52, 11.88it/s]

Epoch 2240: Loss = 0.6780
Epoch 2240: Loss = 0.6634
Epoch 2240: Loss = 0.6850
Epoch 2240: Loss = 0.6940
Epoch 2240: Loss = 0.6823


 23%|██▎       | 2252/10000 [03:05<11:10, 11.55it/s]

Epoch 2250: Loss = 0.6678
Epoch 2250: Loss = 0.6915
Epoch 2250: Loss = 0.6510
Epoch 2250: Loss = 0.6807
Epoch 2250: Loss = 0.6905


 23%|██▎       | 2260/10000 [03:05<09:57, 12.96it/s]

Epoch 2260: Loss = 0.6863
Epoch 2260: Loss = 0.6765
Epoch 2260: Loss = 0.6623
Epoch 2260: Loss = 0.6640
Epoch 2260: Loss = 0.6340


 23%|██▎       | 2272/10000 [03:06<10:07, 12.73it/s]

Epoch 2270: Loss = 0.6675
Epoch 2270: Loss = 0.6857
Epoch 2270: Loss = 0.6624
Epoch 2270: Loss = 0.6594
Epoch 2270: Loss = 0.7030


 23%|██▎       | 2282/10000 [03:07<09:43, 13.24it/s]

Epoch 2280: Loss = 0.7007
Epoch 2280: Loss = 0.6629
Epoch 2280: Loss = 0.6667
Epoch 2280: Loss = 0.6824
Epoch 2280: Loss = 0.7008


 23%|██▎       | 2292/10000 [03:08<11:47, 10.90it/s]

Epoch 2290: Loss = 0.6638
Epoch 2290: Loss = 0.6615
Epoch 2290: Loss = 0.6846
Epoch 2290: Loss = 0.6833
Epoch 2290: Loss = 0.6614


 23%|██▎       | 2302/10000 [03:09<10:57, 11.70it/s]

Epoch 2300: Loss = 0.6405
Epoch 2300: Loss = 0.6968
Epoch 2300: Loss = 0.6600
Epoch 2300: Loss = 0.6744
Epoch 2300: Loss = 0.6825


 23%|██▎       | 2312/10000 [03:10<10:46, 11.89it/s]

Epoch 2310: Loss = 0.6536
Epoch 2310: Loss = 0.6776
Epoch 2310: Loss = 0.6850
Epoch 2310: Loss = 0.6742
Epoch 2310: Loss = 0.6556


 23%|██▎       | 2322/10000 [03:11<11:57, 10.70it/s]

Epoch 2320: Loss = 0.6777
Epoch 2320: Loss = 0.6811
Epoch 2320: Loss = 0.6484
Epoch 2320: Loss = 0.6868
Epoch 2320: Loss = 0.6988


 23%|██▎       | 2332/10000 [03:11<11:13, 11.39it/s]

Epoch 2330: Loss = 0.6458
Epoch 2330: Loss = 0.6501
Epoch 2330: Loss = 0.6516
Epoch 2330: Loss = 0.6491
Epoch 2330: Loss = 0.6765


 23%|██▎       | 2342/10000 [03:12<10:15, 12.43it/s]

Epoch 2340: Loss = 0.6444
Epoch 2340: Loss = 0.6904
Epoch 2340: Loss = 0.6939
Epoch 2340: Loss = 0.6672
Epoch 2340: Loss = 0.6885


 24%|██▎       | 2352/10000 [03:13<09:54, 12.86it/s]

Epoch 2350: Loss = 0.6679
Epoch 2350: Loss = 0.6594
Epoch 2350: Loss = 0.6635
Epoch 2350: Loss = 0.6521
Epoch 2350: Loss = 0.7113


 24%|██▎       | 2362/10000 [03:14<11:17, 11.28it/s]

Epoch 2360: Loss = 0.7018
Epoch 2360: Loss = 0.7030
Epoch 2360: Loss = 0.6748
Epoch 2360: Loss = 0.6756
Epoch 2360: Loss = 0.6560


 24%|██▎       | 2372/10000 [03:15<10:29, 12.12it/s]

Epoch 2370: Loss = 0.6566
Epoch 2370: Loss = 0.6570
Epoch 2370: Loss = 0.6798
Epoch 2370: Loss = 0.6891
Epoch 2370: Loss = 0.6825


 24%|██▍       | 2382/10000 [03:16<09:37, 13.19it/s]

Epoch 2380: Loss = 0.6727
Epoch 2380: Loss = 0.6426
Epoch 2380: Loss = 0.6714
Epoch 2380: Loss = 0.6656
Epoch 2380: Loss = 0.6719


 24%|██▍       | 2392/10000 [03:16<10:03, 12.60it/s]

Epoch 2390: Loss = 0.6582
Epoch 2390: Loss = 0.6924
Epoch 2390: Loss = 0.6939
Epoch 2390: Loss = 0.6740
Epoch 2390: Loss = 0.6810


 24%|██▍       | 2402/10000 [03:17<10:17, 12.31it/s]

Epoch 2400: Loss = 0.6582
Epoch 2400: Loss = 0.7066
Epoch 2400: Loss = 0.6738
Epoch 2400: Loss = 0.6764
Epoch 2400: Loss = 0.6748


 24%|██▍       | 2412/10000 [03:18<11:24, 11.09it/s]

Epoch 2410: Loss = 0.6717
Epoch 2410: Loss = 0.6616
Epoch 2410: Loss = 0.6733
Epoch 2410: Loss = 0.6747
Epoch 2410: Loss = 0.6847


 24%|██▍       | 2422/10000 [03:19<10:39, 11.85it/s]

Epoch 2420: Loss = 0.6625
Epoch 2420: Loss = 0.6965
Epoch 2420: Loss = 0.6934
Epoch 2420: Loss = 0.6333
Epoch 2420: Loss = 0.6595


 24%|██▍       | 2432/10000 [03:20<10:21, 12.18it/s]

Epoch 2430: Loss = 0.6681
Epoch 2430: Loss = 0.7089
Epoch 2430: Loss = 0.6832
Epoch 2430: Loss = 0.6934
Epoch 2430: Loss = 0.6837


 24%|██▍       | 2442/10000 [03:21<10:06, 12.47it/s]

Epoch 2440: Loss = 0.6854
Epoch 2440: Loss = 0.6691
Epoch 2440: Loss = 0.6516
Epoch 2440: Loss = 0.6823
Epoch 2440: Loss = 0.6332


 25%|██▍       | 2452/10000 [03:21<10:53, 11.54it/s]

Epoch 2450: Loss = 0.6847
Epoch 2450: Loss = 0.6898
Epoch 2450: Loss = 0.6619
Epoch 2450: Loss = 0.6737
Epoch 2450: Loss = 0.6860


 25%|██▍       | 2462/10000 [03:22<09:40, 12.99it/s]

Epoch 2460: Loss = 0.6806
Epoch 2460: Loss = 0.6805
Epoch 2460: Loss = 0.6901
Epoch 2460: Loss = 0.6744
Epoch 2460: Loss = 0.6698


 25%|██▍       | 2472/10000 [03:23<10:30, 11.94it/s]

Epoch 2470: Loss = 0.6923
Epoch 2470: Loss = 0.6721
Epoch 2470: Loss = 0.6901
Epoch 2470: Loss = 0.6830
Epoch 2470: Loss = 0.7050


 25%|██▍       | 2482/10000 [03:24<10:11, 12.29it/s]

Epoch 2480: Loss = 0.6692
Epoch 2480: Loss = 0.6905
Epoch 2480: Loss = 0.6709
Epoch 2480: Loss = 0.6527
Epoch 2480: Loss = 0.6498


 25%|██▍       | 2492/10000 [03:25<09:27, 13.22it/s]

Epoch 2490: Loss = 0.6663
Epoch 2490: Loss = 0.6552
Epoch 2490: Loss = 0.6631
Epoch 2490: Loss = 0.6586
Epoch 2490: Loss = 0.6597


 25%|██▌       | 2502/10000 [03:25<10:44, 11.64it/s]

Epoch 2500: Loss = 0.6705
Epoch 2500: Loss = 0.6674
Epoch 2500: Loss = 0.6622
Epoch 2500: Loss = 0.6543
Epoch 2500: Loss = 0.6500


 25%|██▌       | 2512/10000 [03:26<09:31, 13.11it/s]

Epoch 2510: Loss = 0.6581
Epoch 2510: Loss = 0.6919
Epoch 2510: Loss = 0.6783
Epoch 2510: Loss = 0.6731
Epoch 2510: Loss = 0.6720


 25%|██▌       | 2522/10000 [03:27<11:03, 11.28it/s]

Epoch 2520: Loss = 0.6587
Epoch 2520: Loss = 0.6683
Epoch 2520: Loss = 0.6338
Epoch 2520: Loss = 0.6748
Epoch 2520: Loss = 0.6965


 25%|██▌       | 2532/10000 [03:28<10:27, 11.90it/s]

Epoch 2530: Loss = 0.6724
Epoch 2530: Loss = 0.7114
Epoch 2530: Loss = 0.6626
Epoch 2530: Loss = 0.6601
Epoch 2530: Loss = 0.6979


 25%|██▌       | 2542/10000 [03:29<11:57, 10.40it/s]

Epoch 2540: Loss = 0.7093
Epoch 2540: Loss = 0.6722
Epoch 2540: Loss = 0.6773
Epoch 2540: Loss = 0.6723
Epoch 2540: Loss = 0.6628


 26%|██▌       | 2552/10000 [03:30<10:11, 12.18it/s]

Epoch 2550: Loss = 0.6920
Epoch 2550: Loss = 0.7094
Epoch 2550: Loss = 0.6765
Epoch 2550: Loss = 0.7075
Epoch 2550: Loss = 0.7007


 26%|██▌       | 2562/10000 [03:30<08:57, 13.84it/s]

Epoch 2560: Loss = 0.6762
Epoch 2560: Loss = 0.6913
Epoch 2560: Loss = 0.6580
Epoch 2560: Loss = 0.6682
Epoch 2560: Loss = 0.6834


 26%|██▌       | 2572/10000 [03:31<08:48, 14.06it/s]

Epoch 2570: Loss = 0.6729
Epoch 2570: Loss = 0.6386
Epoch 2570: Loss = 0.6632
Epoch 2570: Loss = 0.6830
Epoch 2570: Loss = 0.6372


 26%|██▌       | 2582/10000 [03:32<09:07, 13.55it/s]

Epoch 2580: Loss = 0.6766
Epoch 2580: Loss = 0.6682
Epoch 2580: Loss = 0.6794
Epoch 2580: Loss = 0.6705
Epoch 2580: Loss = 0.6670


 26%|██▌       | 2592/10000 [03:33<10:37, 11.62it/s]

Epoch 2590: Loss = 0.6562
Epoch 2590: Loss = 0.6604
Epoch 2590: Loss = 0.6645
Epoch 2590: Loss = 0.7046
Epoch 2590: Loss = 0.6717


 26%|██▌       | 2602/10000 [03:34<10:22, 11.89it/s]

Epoch 2600: Loss = 0.6611
Epoch 2600: Loss = 0.6344
Epoch 2600: Loss = 0.6800
Epoch 2600: Loss = 0.6646
Epoch 2600: Loss = 0.6109


 26%|██▌       | 2612/10000 [03:35<11:11, 11.00it/s]

Epoch 2610: Loss = 0.6971
Epoch 2610: Loss = 0.6763
Epoch 2610: Loss = 0.6649
Epoch 2610: Loss = 0.6529
Epoch 2610: Loss = 0.6799


 26%|██▌       | 2622/10000 [03:35<10:15, 11.98it/s]

Epoch 2620: Loss = 0.6399
Epoch 2620: Loss = 0.6827
Epoch 2620: Loss = 0.7010
Epoch 2620: Loss = 0.6617
Epoch 2620: Loss = 0.6601


 26%|██▋       | 2632/10000 [03:36<09:03, 13.55it/s]

Epoch 2630: Loss = 0.6577
Epoch 2630: Loss = 0.6746
Epoch 2630: Loss = 0.6511
Epoch 2630: Loss = 0.6744
Epoch 2630: Loss = 0.7015


 26%|██▋       | 2642/10000 [03:37<08:40, 14.14it/s]

Epoch 2640: Loss = 0.6788
Epoch 2640: Loss = 0.6795
Epoch 2640: Loss = 0.6490
Epoch 2640: Loss = 0.7127
Epoch 2640: Loss = 0.6890


 27%|██▋       | 2652/10000 [03:38<09:13, 13.29it/s]

Epoch 2650: Loss = 0.6692
Epoch 2650: Loss = 0.6482
Epoch 2650: Loss = 0.6513
Epoch 2650: Loss = 0.6840
Epoch 2650: Loss = 0.6619


 27%|██▋       | 2662/10000 [03:38<08:45, 13.96it/s]

Epoch 2660: Loss = 0.6742
Epoch 2660: Loss = 0.6788
Epoch 2660: Loss = 0.6832
Epoch 2660: Loss = 0.6816
Epoch 2660: Loss = 0.7062


 27%|██▋       | 2672/10000 [03:39<08:49, 13.84it/s]

Epoch 2670: Loss = 0.6796
Epoch 2670: Loss = 0.6686
Epoch 2670: Loss = 0.6547
Epoch 2670: Loss = 0.6574
Epoch 2670: Loss = 0.6956


 27%|██▋       | 2682/10000 [03:40<09:04, 13.43it/s]

Epoch 2680: Loss = 0.6701
Epoch 2680: Loss = 0.6331
Epoch 2680: Loss = 0.6852
Epoch 2680: Loss = 0.6490
Epoch 2680: Loss = 0.6738


 27%|██▋       | 2692/10000 [03:41<08:43, 13.96it/s]

Epoch 2690: Loss = 0.6674
Epoch 2690: Loss = 0.7288
Epoch 2690: Loss = 0.7005
Epoch 2690: Loss = 0.6884
Epoch 2690: Loss = 0.6631


 27%|██▋       | 2702/10000 [03:41<08:47, 13.84it/s]

Epoch 2700: Loss = 0.6678
Epoch 2700: Loss = 0.6885
Epoch 2700: Loss = 0.6771
Epoch 2700: Loss = 0.6910
Epoch 2700: Loss = 0.7067


 27%|██▋       | 2712/10000 [03:42<08:47, 13.81it/s]

Epoch 2710: Loss = 0.7048
Epoch 2710: Loss = 0.6861
Epoch 2710: Loss = 0.6785
Epoch 2710: Loss = 0.6694
Epoch 2710: Loss = 0.6802


 27%|██▋       | 2722/10000 [03:43<08:37, 14.07it/s]

Epoch 2720: Loss = 0.6635
Epoch 2720: Loss = 0.6565
Epoch 2720: Loss = 0.6586
Epoch 2720: Loss = 0.6353
Epoch 2720: Loss = 0.6734


 27%|██▋       | 2732/10000 [03:44<08:32, 14.18it/s]

Epoch 2730: Loss = 0.6665
Epoch 2730: Loss = 0.6900
Epoch 2730: Loss = 0.6928
Epoch 2730: Loss = 0.7215
Epoch 2730: Loss = 0.6709


 27%|██▋       | 2742/10000 [03:44<08:47, 13.75it/s]

Epoch 2740: Loss = 0.6833
Epoch 2740: Loss = 0.6332
Epoch 2740: Loss = 0.6526
Epoch 2740: Loss = 0.6733
Epoch 2740: Loss = 0.6671


 28%|██▊       | 2752/10000 [03:45<09:09, 13.18it/s]

Epoch 2750: Loss = 0.6844
Epoch 2750: Loss = 0.6855
Epoch 2750: Loss = 0.6746
Epoch 2750: Loss = 0.6622
Epoch 2750: Loss = 0.6755


 28%|██▊       | 2762/10000 [03:46<08:58, 13.45it/s]

Epoch 2760: Loss = 0.7027
Epoch 2760: Loss = 0.6538
Epoch 2760: Loss = 0.6669
Epoch 2760: Loss = 0.6710
Epoch 2760: Loss = 0.6531


 28%|██▊       | 2772/10000 [03:47<09:23, 12.84it/s]

Epoch 2770: Loss = 0.6503
Epoch 2770: Loss = 0.6606
Epoch 2770: Loss = 0.6583
Epoch 2770: Loss = 0.6931
Epoch 2770: Loss = 0.6873


 28%|██▊       | 2782/10000 [03:47<08:37, 13.94it/s]

Epoch 2780: Loss = 0.6640
Epoch 2780: Loss = 0.6613
Epoch 2780: Loss = 0.6711
Epoch 2780: Loss = 0.6626
Epoch 2780: Loss = 0.6505


 28%|██▊       | 2792/10000 [03:48<08:25, 14.25it/s]

Epoch 2790: Loss = 0.7051
Epoch 2790: Loss = 0.6945
Epoch 2790: Loss = 0.6530
Epoch 2790: Loss = 0.6372
Epoch 2790: Loss = 0.6517


 28%|██▊       | 2802/10000 [03:49<08:32, 14.05it/s]

Epoch 2800: Loss = 0.6763
Epoch 2800: Loss = 0.6620
Epoch 2800: Loss = 0.6767
Epoch 2800: Loss = 0.6572
Epoch 2800: Loss = 0.6942


 28%|██▊       | 2812/10000 [03:50<10:36, 11.30it/s]

Epoch 2810: Loss = 0.6536
Epoch 2810: Loss = 0.6605
Epoch 2810: Loss = 0.6580
Epoch 2810: Loss = 0.6660
Epoch 2810: Loss = 0.6868


 28%|██▊       | 2822/10000 [03:51<10:14, 11.67it/s]

Epoch 2820: Loss = 0.6819
Epoch 2820: Loss = 0.6631
Epoch 2820: Loss = 0.6943
Epoch 2820: Loss = 0.6610
Epoch 2820: Loss = 0.6949


 28%|██▊       | 2832/10000 [03:51<09:17, 12.87it/s]

Epoch 2830: Loss = 0.6665
Epoch 2830: Loss = 0.6483
Epoch 2830: Loss = 0.6733
Epoch 2830: Loss = 0.6754
Epoch 2830: Loss = 0.6683


 28%|██▊       | 2842/10000 [03:52<08:35, 13.88it/s]

Epoch 2840: Loss = 0.6980
Epoch 2840: Loss = 0.6675
Epoch 2840: Loss = 0.6273
Epoch 2840: Loss = 0.6656
Epoch 2840: Loss = 0.6895


 29%|██▊       | 2852/10000 [03:53<08:26, 14.13it/s]

Epoch 2850: Loss = 0.6679
Epoch 2850: Loss = 0.6957
Epoch 2850: Loss = 0.6499
Epoch 2850: Loss = 0.6798
Epoch 2850: Loss = 0.7116


 29%|██▊       | 2862/10000 [03:54<09:59, 11.91it/s]

Epoch 2860: Loss = 0.6739
Epoch 2860: Loss = 0.6750
Epoch 2860: Loss = 0.7122
Epoch 2860: Loss = 0.6706
Epoch 2860: Loss = 0.6556


 29%|██▊       | 2872/10000 [03:54<09:18, 12.77it/s]

Epoch 2870: Loss = 0.6545
Epoch 2870: Loss = 0.6723
Epoch 2870: Loss = 0.6724
Epoch 2870: Loss = 0.7036
Epoch 2870: Loss = 0.6723


 29%|██▉       | 2882/10000 [03:55<10:05, 11.76it/s]

Epoch 2880: Loss = 0.6758
Epoch 2880: Loss = 0.6598
Epoch 2880: Loss = 0.7010
Epoch 2880: Loss = 0.6635
Epoch 2880: Loss = 0.6947


 29%|██▉       | 2892/10000 [03:56<09:11, 12.89it/s]

Epoch 2890: Loss = 0.6573
Epoch 2890: Loss = 0.6503
Epoch 2890: Loss = 0.7020
Epoch 2890: Loss = 0.6729
Epoch 2890: Loss = 0.6775


 29%|██▉       | 2902/10000 [03:57<08:26, 14.01it/s]

Epoch 2900: Loss = 0.6680
Epoch 2900: Loss = 0.6491
Epoch 2900: Loss = 0.6644
Epoch 2900: Loss = 0.6932
Epoch 2900: Loss = 0.6973


 29%|██▉       | 2912/10000 [03:57<08:12, 14.40it/s]

Epoch 2910: Loss = 0.6407
Epoch 2910: Loss = 0.6438
Epoch 2910: Loss = 0.6780
Epoch 2910: Loss = 0.6603
Epoch 2910: Loss = 0.6675


 29%|██▉       | 2922/10000 [03:58<08:24, 14.04it/s]

Epoch 2920: Loss = 0.6726
Epoch 2920: Loss = 0.6914
Epoch 2920: Loss = 0.6883
Epoch 2920: Loss = 0.6565
Epoch 2920: Loss = 0.6615


 29%|██▉       | 2932/10000 [03:59<08:45, 13.46it/s]

Epoch 2930: Loss = 0.6648
Epoch 2930: Loss = 0.6744
Epoch 2930: Loss = 0.6879
Epoch 2930: Loss = 0.6697
Epoch 2930: Loss = 0.7032


 29%|██▉       | 2942/10000 [04:00<08:20, 14.10it/s]

Epoch 2940: Loss = 0.6637
Epoch 2940: Loss = 0.6830
Epoch 2940: Loss = 0.6998
Epoch 2940: Loss = 0.6441
Epoch 2940: Loss = 0.6952


 30%|██▉       | 2952/10000 [04:00<08:39, 13.56it/s]

Epoch 2950: Loss = 0.6715
Epoch 2950: Loss = 0.6848
Epoch 2950: Loss = 0.6563
Epoch 2950: Loss = 0.6904
Epoch 2950: Loss = 0.6631


 30%|██▉       | 2962/10000 [04:01<08:44, 13.43it/s]

Epoch 2960: Loss = 0.6338
Epoch 2960: Loss = 0.6879
Epoch 2960: Loss = 0.6522
Epoch 2960: Loss = 0.6504
Epoch 2960: Loss = 0.6834


 30%|██▉       | 2972/10000 [04:02<08:23, 13.97it/s]

Epoch 2970: Loss = 0.6720
Epoch 2970: Loss = 0.6644
Epoch 2970: Loss = 0.6585
Epoch 2970: Loss = 0.6656
Epoch 2970: Loss = 0.6955


 30%|██▉       | 2982/10000 [04:03<09:21, 12.50it/s]

Epoch 2980: Loss = 0.6699
Epoch 2980: Loss = 0.6561
Epoch 2980: Loss = 0.6569
Epoch 2980: Loss = 0.6755
Epoch 2980: Loss = 0.6952


 30%|██▉       | 2992/10000 [04:03<10:19, 11.32it/s]

Epoch 2990: Loss = 0.6659
Epoch 2990: Loss = 0.6914
Epoch 2990: Loss = 0.6707
Epoch 2990: Loss = 0.6763
Epoch 2990: Loss = 0.6605


 30%|███       | 3002/10000 [04:04<09:56, 11.73it/s]

Epoch 3000: Loss = 0.6897
Epoch 3000: Loss = 0.6671
Epoch 3000: Loss = 0.6934
Epoch 3000: Loss = 0.7136
Epoch 3000: Loss = 0.6755


 30%|███       | 3012/10000 [04:05<10:20, 11.25it/s]

Epoch 3010: Loss = 0.6288
Epoch 3010: Loss = 0.6513
Epoch 3010: Loss = 0.6734
Epoch 3010: Loss = 0.6649
Epoch 3010: Loss = 0.6431


 30%|███       | 3022/10000 [04:06<11:05, 10.48it/s]

Epoch 3020: Loss = 0.6675
Epoch 3020: Loss = 0.6735
Epoch 3020: Loss = 0.6471
Epoch 3020: Loss = 0.6841
Epoch 3020: Loss = 0.7109


 30%|███       | 3032/10000 [04:07<09:57, 11.66it/s]

Epoch 3030: Loss = 0.6539
Epoch 3030: Loss = 0.6439
Epoch 3030: Loss = 0.6665
Epoch 3030: Loss = 0.6721
Epoch 3030: Loss = 0.6702


 30%|███       | 3042/10000 [04:08<09:24, 12.32it/s]

Epoch 3040: Loss = 0.6816
Epoch 3040: Loss = 0.7076
Epoch 3040: Loss = 0.6493
Epoch 3040: Loss = 0.6560
Epoch 3040: Loss = 0.6403


 31%|███       | 3052/10000 [04:09<11:13, 10.32it/s]

Epoch 3050: Loss = 0.6804
Epoch 3050: Loss = 0.6755
Epoch 3050: Loss = 0.6718
Epoch 3050: Loss = 0.6739
Epoch 3050: Loss = 0.6725


 31%|███       | 3060/10000 [04:10<10:52, 10.64it/s]

Epoch 3060: Loss = 0.6677
Epoch 3060: Loss = 0.6494
Epoch 3060: Loss = 0.7063
Epoch 3060: Loss = 0.6640
Epoch 3060: Loss = 0.6848


 31%|███       | 3072/10000 [04:11<11:05, 10.41it/s]

Epoch 3070: Loss = 0.6667
Epoch 3070: Loss = 0.6950
Epoch 3070: Loss = 0.6968
Epoch 3070: Loss = 0.6580
Epoch 3070: Loss = 0.6890


 31%|███       | 3082/10000 [04:12<10:00, 11.52it/s]

Epoch 3080: Loss = 0.6651
Epoch 3080: Loss = 0.6784
Epoch 3080: Loss = 0.6841
Epoch 3080: Loss = 0.6444
Epoch 3080: Loss = 0.6384


 31%|███       | 3092/10000 [04:13<10:53, 10.58it/s]

Epoch 3090: Loss = 0.6941
Epoch 3090: Loss = 0.6586
Epoch 3090: Loss = 0.6692
Epoch 3090: Loss = 0.6920
Epoch 3090: Loss = 0.6585


 31%|███       | 3102/10000 [04:13<09:17, 12.38it/s]

Epoch 3100: Loss = 0.6696
Epoch 3100: Loss = 0.6749
Epoch 3100: Loss = 0.6665
Epoch 3100: Loss = 0.6897
Epoch 3100: Loss = 0.6951


 31%|███       | 3112/10000 [04:14<09:42, 11.82it/s]

Epoch 3110: Loss = 0.6772
Epoch 3110: Loss = 0.6546
Epoch 3110: Loss = 0.6694
Epoch 3110: Loss = 0.6829
Epoch 3110: Loss = 0.6849


 31%|███       | 3122/10000 [04:15<08:49, 13.00it/s]

Epoch 3120: Loss = 0.6881
Epoch 3120: Loss = 0.6233
Epoch 3120: Loss = 0.6780
Epoch 3120: Loss = 0.6648
Epoch 3120: Loss = 0.6501


 31%|███▏      | 3132/10000 [04:16<10:08, 11.29it/s]

Epoch 3130: Loss = 0.6828
Epoch 3130: Loss = 0.6689
Epoch 3130: Loss = 0.6728
Epoch 3130: Loss = 0.6810
Epoch 3130: Loss = 0.6520


 31%|███▏      | 3141/10000 [04:17<10:46, 10.61it/s]

Epoch 3140: Loss = 0.6881
Epoch 3140: Loss = 0.6954
Epoch 3140: Loss = 0.6347
Epoch 3140: Loss = 0.6238
Epoch 3140: Loss = 0.6850


 32%|███▏      | 3153/10000 [04:18<08:54, 12.82it/s]

Epoch 3150: Loss = 0.6583
Epoch 3150: Loss = 0.6460
Epoch 3150: Loss = 0.6791
Epoch 3150: Loss = 0.6437
Epoch 3150: Loss = 0.6808


 32%|███▏      | 3163/10000 [04:18<08:13, 13.87it/s]

Epoch 3160: Loss = 0.6821
Epoch 3160: Loss = 0.6515
Epoch 3160: Loss = 0.6487
Epoch 3160: Loss = 0.6477
Epoch 3160: Loss = 0.6828


 32%|███▏      | 3173/10000 [04:19<08:03, 14.11it/s]

Epoch 3170: Loss = 0.6821
Epoch 3170: Loss = 0.6715
Epoch 3170: Loss = 0.6747
Epoch 3170: Loss = 0.6506
Epoch 3170: Loss = 0.6640


 32%|███▏      | 3183/10000 [04:20<08:03, 14.11it/s]

Epoch 3180: Loss = 0.6465
Epoch 3180: Loss = 0.6413
Epoch 3180: Loss = 0.6649
Epoch 3180: Loss = 0.6810
Epoch 3180: Loss = 0.6608


 32%|███▏      | 3193/10000 [04:21<08:06, 13.99it/s]

Epoch 3190: Loss = 0.7106
Epoch 3190: Loss = 0.7082
Epoch 3190: Loss = 0.6948
Epoch 3190: Loss = 0.6723
Epoch 3190: Loss = 0.7074


 32%|███▏      | 3201/10000 [04:21<09:53, 11.46it/s]

Epoch 3200: Loss = 0.6685
Epoch 3200: Loss = 0.6783
Epoch 3200: Loss = 0.6451
Epoch 3200: Loss = 0.6635
Epoch 3200: Loss = 0.6750


 32%|███▏      | 3211/10000 [04:22<09:43, 11.63it/s]

Epoch 3210: Loss = 0.6963
Epoch 3210: Loss = 0.6675
Epoch 3210: Loss = 0.7087
Epoch 3210: Loss = 0.6590
Epoch 3210: Loss = 0.6618


 32%|███▏      | 3221/10000 [04:23<11:11, 10.09it/s]

Epoch 3220: Loss = 0.6487
Epoch 3220: Loss = 0.6748
Epoch 3220: Loss = 0.6969
Epoch 3220: Loss = 0.6755
Epoch 3220: Loss = 0.6737


 32%|███▏      | 3231/10000 [04:24<09:52, 11.42it/s]

Epoch 3230: Loss = 0.6447
Epoch 3230: Loss = 0.6764
Epoch 3230: Loss = 0.7319
Epoch 3230: Loss = 0.6917
Epoch 3230: Loss = 0.6751


 32%|███▏      | 3241/10000 [04:25<09:34, 11.76it/s]

Epoch 3240: Loss = 0.6733
Epoch 3240: Loss = 0.6690
Epoch 3240: Loss = 0.6748
Epoch 3240: Loss = 0.6918
Epoch 3240: Loss = 0.6688


 33%|███▎      | 3251/10000 [04:26<09:11, 12.24it/s]

Epoch 3250: Loss = 0.6754
Epoch 3250: Loss = 0.6943
Epoch 3250: Loss = 0.6443
Epoch 3250: Loss = 0.6681
Epoch 3250: Loss = 0.6310


 33%|███▎      | 3261/10000 [04:26<08:43, 12.87it/s]

Epoch 3260: Loss = 0.6875
Epoch 3260: Loss = 0.6531
Epoch 3260: Loss = 0.6552
Epoch 3260: Loss = 0.6534
Epoch 3260: Loss = 0.6641


 33%|███▎      | 3273/10000 [04:27<08:23, 13.37it/s]

Epoch 3270: Loss = 0.6659
Epoch 3270: Loss = 0.6737
Epoch 3270: Loss = 0.6901
Epoch 3270: Loss = 0.6658
Epoch 3270: Loss = 0.6376


 33%|███▎      | 3283/10000 [04:28<07:54, 14.15it/s]

Epoch 3280: Loss = 0.6506
Epoch 3280: Loss = 0.6574
Epoch 3280: Loss = 0.6964
Epoch 3280: Loss = 0.6700
Epoch 3280: Loss = 0.6258


 33%|███▎      | 3293/10000 [04:29<08:30, 13.15it/s]

Epoch 3290: Loss = 0.6767
Epoch 3290: Loss = 0.6825
Epoch 3290: Loss = 0.6590
Epoch 3290: Loss = 0.6684
Epoch 3290: Loss = 0.6538


 33%|███▎      | 3303/10000 [04:30<07:50, 14.25it/s]

Epoch 3300: Loss = 0.6654
Epoch 3300: Loss = 0.6777
Epoch 3300: Loss = 0.6392
Epoch 3300: Loss = 0.6898
Epoch 3300: Loss = 0.6680


 33%|███▎      | 3313/10000 [04:30<07:56, 14.02it/s]

Epoch 3310: Loss = 0.6631
Epoch 3310: Loss = 0.6602
Epoch 3310: Loss = 0.6816
Epoch 3310: Loss = 0.7132
Epoch 3310: Loss = 0.6440


 33%|███▎      | 3323/10000 [04:31<08:15, 13.49it/s]

Epoch 3320: Loss = 0.6650
Epoch 3320: Loss = 0.6749
Epoch 3320: Loss = 0.6669
Epoch 3320: Loss = 0.6597
Epoch 3320: Loss = 0.6642


 33%|███▎      | 3333/10000 [04:32<08:02, 13.82it/s]

Epoch 3330: Loss = 0.6708
Epoch 3330: Loss = 0.6829
Epoch 3330: Loss = 0.6776
Epoch 3330: Loss = 0.6879
Epoch 3330: Loss = 0.6642


 33%|███▎      | 3341/10000 [04:32<08:21, 13.28it/s]

Epoch 3340: Loss = 0.6791
Epoch 3340: Loss = 0.6583
Epoch 3340: Loss = 0.6602
Epoch 3340: Loss = 0.6554
Epoch 3340: Loss = 0.6933


 34%|███▎      | 3353/10000 [04:33<07:58, 13.89it/s]

Epoch 3350: Loss = 0.6627
Epoch 3350: Loss = 0.6593
Epoch 3350: Loss = 0.7244
Epoch 3350: Loss = 0.6261
Epoch 3350: Loss = 0.6594


 34%|███▎      | 3363/10000 [04:34<08:47, 12.58it/s]

Epoch 3360: Loss = 0.7023
Epoch 3360: Loss = 0.6447
Epoch 3360: Loss = 0.6566
Epoch 3360: Loss = 0.6997
Epoch 3360: Loss = 0.6546


 34%|███▎      | 3371/10000 [04:35<08:59, 12.29it/s]

Epoch 3370: Loss = 0.6232
Epoch 3370: Loss = 0.6544
Epoch 3370: Loss = 0.6879
Epoch 3370: Loss = 0.6978
Epoch 3370: Loss = 0.6673


 34%|███▍      | 3383/10000 [04:36<08:18, 13.28it/s]

Epoch 3380: Loss = 0.6699
Epoch 3380: Loss = 0.6615
Epoch 3380: Loss = 0.6676
Epoch 3380: Loss = 0.6591
Epoch 3380: Loss = 0.6970


 34%|███▍      | 3393/10000 [04:36<07:46, 14.15it/s]

Epoch 3390: Loss = 0.6775
Epoch 3390: Loss = 0.6285
Epoch 3390: Loss = 0.7062
Epoch 3390: Loss = 0.6642
Epoch 3390: Loss = 0.6885


 34%|███▍      | 3401/10000 [04:37<08:16, 13.30it/s]

Epoch 3400: Loss = 0.6725
Epoch 3400: Loss = 0.6623
Epoch 3400: Loss = 0.6880
Epoch 3400: Loss = 0.6767
Epoch 3400: Loss = 0.6844


 34%|███▍      | 3413/10000 [04:38<07:49, 14.04it/s]

Epoch 3410: Loss = 0.6667
Epoch 3410: Loss = 0.6649
Epoch 3410: Loss = 0.6535
Epoch 3410: Loss = 0.6710
Epoch 3410: Loss = 0.6999


 34%|███▍      | 3423/10000 [04:39<07:58, 13.74it/s]

Epoch 3420: Loss = 0.7191
Epoch 3420: Loss = 0.6552
Epoch 3420: Loss = 0.6739
Epoch 3420: Loss = 0.6401
Epoch 3420: Loss = 0.6667


 34%|███▍      | 3431/10000 [04:39<09:28, 11.55it/s]

Epoch 3430: Loss = 0.6660
Epoch 3430: Loss = 0.6662
Epoch 3430: Loss = 0.6466
Epoch 3430: Loss = 0.7043
Epoch 3430: Loss = 0.6993


 34%|███▍      | 3441/10000 [04:40<07:56, 13.75it/s]

Epoch 3440: Loss = 0.6550
Epoch 3440: Loss = 0.6488
Epoch 3440: Loss = 0.6804
Epoch 3440: Loss = 0.6726
Epoch 3440: Loss = 0.6736


 35%|███▍      | 3453/10000 [04:41<07:45, 14.08it/s]

Epoch 3450: Loss = 0.6457
Epoch 3450: Loss = 0.6575
Epoch 3450: Loss = 0.6476
Epoch 3450: Loss = 0.6549
Epoch 3450: Loss = 0.6760


 35%|███▍      | 3463/10000 [04:42<07:41, 14.18it/s]

Epoch 3460: Loss = 0.6859
Epoch 3460: Loss = 0.6570
Epoch 3460: Loss = 0.6680
Epoch 3460: Loss = 0.6758
Epoch 3460: Loss = 0.6644


 35%|███▍      | 3473/10000 [04:42<08:05, 13.43it/s]

Epoch 3470: Loss = 0.6776
Epoch 3470: Loss = 0.7141
Epoch 3470: Loss = 0.6633
Epoch 3470: Loss = 0.6658
Epoch 3470: Loss = 0.6938


 35%|███▍      | 3483/10000 [04:43<07:44, 14.04it/s]

Epoch 3480: Loss = 0.6539
Epoch 3480: Loss = 0.6448
Epoch 3480: Loss = 0.6627
Epoch 3480: Loss = 0.6711
Epoch 3480: Loss = 0.6686


 35%|███▍      | 3491/10000 [04:44<07:39, 14.16it/s]

Epoch 3490: Loss = 0.6857
Epoch 3490: Loss = 0.6931
Epoch 3490: Loss = 0.6804
Epoch 3490: Loss = 0.6609
Epoch 3490: Loss = 0.6849


 35%|███▌      | 3503/10000 [04:45<08:12, 13.20it/s]

Epoch 3500: Loss = 0.6913
Epoch 3500: Loss = 0.6774
Epoch 3500: Loss = 0.7080
Epoch 3500: Loss = 0.6735
Epoch 3500: Loss = 0.6895


 35%|███▌      | 3513/10000 [04:45<07:38, 14.16it/s]

Epoch 3510: Loss = 0.7098
Epoch 3510: Loss = 0.6642
Epoch 3510: Loss = 0.7053
Epoch 3510: Loss = 0.6907
Epoch 3510: Loss = 0.6865


 35%|███▌      | 3521/10000 [04:46<08:49, 12.24it/s]

Epoch 3520: Loss = 0.6748
Epoch 3520: Loss = 0.6950
Epoch 3520: Loss = 0.6697
Epoch 3520: Loss = 0.6535
Epoch 3520: Loss = 0.6698


 35%|███▌      | 3533/10000 [04:47<07:56, 13.56it/s]

Epoch 3530: Loss = 0.6073
Epoch 3530: Loss = 0.6735
Epoch 3530: Loss = 0.6527
Epoch 3530: Loss = 0.6524
Epoch 3530: Loss = 0.6543


 35%|███▌      | 3543/10000 [04:48<07:41, 14.00it/s]

Epoch 3540: Loss = 0.6850
Epoch 3540: Loss = 0.6705
Epoch 3540: Loss = 0.6650
Epoch 3540: Loss = 0.6665
Epoch 3540: Loss = 0.6651


 36%|███▌      | 3553/10000 [04:48<07:31, 14.29it/s]

Epoch 3550: Loss = 0.6196
Epoch 3550: Loss = 0.6410
Epoch 3550: Loss = 0.6552
Epoch 3550: Loss = 0.6679
Epoch 3550: Loss = 0.6650


 36%|███▌      | 3561/10000 [04:49<08:10, 13.12it/s]

Epoch 3560: Loss = 0.6806
Epoch 3560: Loss = 0.6461
Epoch 3560: Loss = 0.6836
Epoch 3560: Loss = 0.6827
Epoch 3560: Loss = 0.6838


 36%|███▌      | 3573/10000 [04:50<07:43, 13.85it/s]

Epoch 3570: Loss = 0.6687
Epoch 3570: Loss = 0.6743
Epoch 3570: Loss = 0.6750
Epoch 3570: Loss = 0.6645
Epoch 3570: Loss = 0.6589


 36%|███▌      | 3581/10000 [04:50<07:55, 13.49it/s]

Epoch 3580: Loss = 0.6709
Epoch 3580: Loss = 0.6834
Epoch 3580: Loss = 0.6980
Epoch 3580: Loss = 0.6762
Epoch 3580: Loss = 0.6773


 36%|███▌      | 3591/10000 [04:51<08:48, 12.12it/s]

Epoch 3590: Loss = 0.6819
Epoch 3590: Loss = 0.6889
Epoch 3590: Loss = 0.6566
Epoch 3590: Loss = 0.6658
Epoch 3590: Loss = 0.6679


 36%|███▌      | 3601/10000 [04:52<08:14, 12.94it/s]

Epoch 3600: Loss = 0.6451
Epoch 3600: Loss = 0.6760
Epoch 3600: Loss = 0.6849
Epoch 3600: Loss = 0.7008
Epoch 3600: Loss = 0.6484


 36%|███▌      | 3613/10000 [04:53<08:24, 12.67it/s]

Epoch 3610: Loss = 0.6603
Epoch 3610: Loss = 0.6510
Epoch 3610: Loss = 0.6754
Epoch 3610: Loss = 0.6552
Epoch 3610: Loss = 0.6898


 36%|███▌      | 3621/10000 [04:54<08:19, 12.77it/s]

Epoch 3620: Loss = 0.6835
Epoch 3620: Loss = 0.6879
Epoch 3620: Loss = 0.6510
Epoch 3620: Loss = 0.6881
Epoch 3620: Loss = 0.6892


 36%|███▋      | 3631/10000 [04:55<10:00, 10.61it/s]

Epoch 3630: Loss = 0.7065
Epoch 3630: Loss = 0.6925
Epoch 3630: Loss = 0.6368
Epoch 3630: Loss = 0.6741
Epoch 3630: Loss = 0.6665


 36%|███▋      | 3641/10000 [04:56<10:42,  9.90it/s]

Epoch 3640: Loss = 0.6631
Epoch 3640: Loss = 0.7011
Epoch 3640: Loss = 0.6898
Epoch 3640: Loss = 0.6590
Epoch 3640: Loss = 0.6991


 37%|███▋      | 3651/10000 [04:57<10:14, 10.33it/s]

Epoch 3650: Loss = 0.6512
Epoch 3650: Loss = 0.6565
Epoch 3650: Loss = 0.6658
Epoch 3650: Loss = 0.6615
Epoch 3650: Loss = 0.6464


 37%|███▋      | 3661/10000 [04:57<08:42, 12.14it/s]

Epoch 3660: Loss = 0.6582
Epoch 3660: Loss = 0.6784
Epoch 3660: Loss = 0.6403
Epoch 3660: Loss = 0.6663
Epoch 3660: Loss = 0.7038


 37%|███▋      | 3671/10000 [04:58<09:07, 11.55it/s]

Epoch 3670: Loss = 0.6583
Epoch 3670: Loss = 0.6935
Epoch 3670: Loss = 0.6874
Epoch 3670: Loss = 0.6299
Epoch 3670: Loss = 0.6776


 37%|███▋      | 3681/10000 [04:59<10:18, 10.21it/s]

Epoch 3680: Loss = 0.6932
Epoch 3680: Loss = 0.6726
Epoch 3680: Loss = 0.6651
Epoch 3680: Loss = 0.6331
Epoch 3680: Loss = 0.6579


 37%|███▋      | 3691/10000 [05:00<10:21, 10.15it/s]

Epoch 3690: Loss = 0.7061
Epoch 3690: Loss = 0.6792
Epoch 3690: Loss = 0.6862
Epoch 3690: Loss = 0.6813
Epoch 3690: Loss = 0.6549


 37%|███▋      | 3700/10000 [05:01<09:02, 11.62it/s]

Epoch 3700: Loss = 0.6472
Epoch 3700: Loss = 0.6903
Epoch 3700: Loss = 0.6388
Epoch 3700: Loss = 0.6928
Epoch 3700: Loss = 0.7094


 37%|███▋      | 3712/10000 [05:02<09:35, 10.92it/s]

Epoch 3710: Loss = 0.6832
Epoch 3710: Loss = 0.6671
Epoch 3710: Loss = 0.6875
Epoch 3710: Loss = 0.6595
Epoch 3710: Loss = 0.7103


 37%|███▋      | 3722/10000 [05:03<08:11, 12.77it/s]

Epoch 3720: Loss = 0.6641
Epoch 3720: Loss = 0.6901
Epoch 3720: Loss = 0.6578
Epoch 3720: Loss = 0.6737
Epoch 3720: Loss = 0.6582


 37%|███▋      | 3732/10000 [05:04<09:30, 10.98it/s]

Epoch 3730: Loss = 0.6644
Epoch 3730: Loss = 0.6917
Epoch 3730: Loss = 0.6623
Epoch 3730: Loss = 0.6781
Epoch 3730: Loss = 0.6920


 37%|███▋      | 3742/10000 [05:05<08:20, 12.50it/s]

Epoch 3740: Loss = 0.6934
Epoch 3740: Loss = 0.6580
Epoch 3740: Loss = 0.6579
Epoch 3740: Loss = 0.6605
Epoch 3740: Loss = 0.6550


 38%|███▊      | 3752/10000 [05:05<07:42, 13.52it/s]

Epoch 3750: Loss = 0.6516
Epoch 3750: Loss = 0.6774
Epoch 3750: Loss = 0.6608
Epoch 3750: Loss = 0.6499
Epoch 3750: Loss = 0.6551


 38%|███▊      | 3762/10000 [05:06<08:11, 12.68it/s]

Epoch 3760: Loss = 0.6861
Epoch 3760: Loss = 0.7085
Epoch 3760: Loss = 0.6742
Epoch 3760: Loss = 0.6547
Epoch 3760: Loss = 0.6648


 38%|███▊      | 3772/10000 [05:07<07:43, 13.43it/s]

Epoch 3770: Loss = 0.6725
Epoch 3770: Loss = 0.6703
Epoch 3770: Loss = 0.7020
Epoch 3770: Loss = 0.6590
Epoch 3770: Loss = 0.6489


 38%|███▊      | 3782/10000 [05:08<09:18, 11.13it/s]

Epoch 3780: Loss = 0.6789
Epoch 3780: Loss = 0.6588
Epoch 3780: Loss = 0.7042
Epoch 3780: Loss = 0.6810
Epoch 3780: Loss = 0.6851


 38%|███▊      | 3792/10000 [05:09<08:50, 11.69it/s]

Epoch 3790: Loss = 0.6646
Epoch 3790: Loss = 0.6640
Epoch 3790: Loss = 0.6634
Epoch 3790: Loss = 0.6492
Epoch 3790: Loss = 0.7013


 38%|███▊      | 3802/10000 [05:10<08:04, 12.79it/s]

Epoch 3800: Loss = 0.6770
Epoch 3800: Loss = 0.6749
Epoch 3800: Loss = 0.6634
Epoch 3800: Loss = 0.6874
Epoch 3800: Loss = 0.6831


 38%|███▊      | 3812/10000 [05:10<07:32, 13.66it/s]

Epoch 3810: Loss = 0.6787
Epoch 3810: Loss = 0.6898
Epoch 3810: Loss = 0.6716
Epoch 3810: Loss = 0.6600
Epoch 3810: Loss = 0.6714


 38%|███▊      | 3822/10000 [05:11<07:49, 13.16it/s]

Epoch 3820: Loss = 0.7094
Epoch 3820: Loss = 0.6765
Epoch 3820: Loss = 0.6587
Epoch 3820: Loss = 0.6568
Epoch 3820: Loss = 0.6384


 38%|███▊      | 3832/10000 [05:12<07:38, 13.46it/s]

Epoch 3830: Loss = 0.6755
Epoch 3830: Loss = 0.6795
Epoch 3830: Loss = 0.6646
Epoch 3830: Loss = 0.6577
Epoch 3830: Loss = 0.6912


 38%|███▊      | 3842/10000 [05:13<08:43, 11.76it/s]

Epoch 3840: Loss = 0.6535
Epoch 3840: Loss = 0.6772
Epoch 3840: Loss = 0.6506
Epoch 3840: Loss = 0.6536
Epoch 3840: Loss = 0.6571


 39%|███▊      | 3852/10000 [05:13<07:41, 13.33it/s]

Epoch 3850: Loss = 0.6778
Epoch 3850: Loss = 0.6632
Epoch 3850: Loss = 0.6631
Epoch 3850: Loss = 0.6553
Epoch 3850: Loss = 0.6538


 39%|███▊      | 3862/10000 [05:14<08:22, 12.21it/s]

Epoch 3860: Loss = 0.6674
Epoch 3860: Loss = 0.6765
Epoch 3860: Loss = 0.7029
Epoch 3860: Loss = 0.6900
Epoch 3860: Loss = 0.6902


 39%|███▊      | 3872/10000 [05:15<08:31, 11.99it/s]

Epoch 3870: Loss = 0.6729
Epoch 3870: Loss = 0.6453
Epoch 3870: Loss = 0.6508
Epoch 3870: Loss = 0.6894
Epoch 3870: Loss = 0.6783


 39%|███▉      | 3882/10000 [05:16<07:44, 13.18it/s]

Epoch 3880: Loss = 0.7032
Epoch 3880: Loss = 0.6379
Epoch 3880: Loss = 0.6436
Epoch 3880: Loss = 0.6832
Epoch 3880: Loss = 0.6355


 39%|███▉      | 3892/10000 [05:17<08:33, 11.89it/s]

Epoch 3890: Loss = 0.6763
Epoch 3890: Loss = 0.6313
Epoch 3890: Loss = 0.6755
Epoch 3890: Loss = 0.6452
Epoch 3890: Loss = 0.6910


 39%|███▉      | 3900/10000 [05:17<09:46, 10.40it/s]

Epoch 3900: Loss = 0.6961
Epoch 3900: Loss = 0.6507
Epoch 3900: Loss = 0.6925
Epoch 3900: Loss = 0.6900
Epoch 3900: Loss = 0.7030


 39%|███▉      | 3912/10000 [05:19<08:50, 11.48it/s]

Epoch 3910: Loss = 0.6702
Epoch 3910: Loss = 0.6964
Epoch 3910: Loss = 0.6589
Epoch 3910: Loss = 0.6598
Epoch 3910: Loss = 0.6548


 39%|███▉      | 3922/10000 [05:19<07:49, 12.94it/s]

Epoch 3920: Loss = 0.7097
Epoch 3920: Loss = 0.6811
Epoch 3920: Loss = 0.6799
Epoch 3920: Loss = 0.6953
Epoch 3920: Loss = 0.6703


 39%|███▉      | 3932/10000 [05:20<09:12, 10.98it/s]

Epoch 3930: Loss = 0.7066
Epoch 3930: Loss = 0.6924
Epoch 3930: Loss = 0.6555
Epoch 3930: Loss = 0.6442
Epoch 3930: Loss = 0.6433


 39%|███▉      | 3942/10000 [05:21<07:49, 12.92it/s]

Epoch 3940: Loss = 0.6777
Epoch 3940: Loss = 0.6440
Epoch 3940: Loss = 0.6851
Epoch 3940: Loss = 0.6295
Epoch 3940: Loss = 0.6364


 40%|███▉      | 3952/10000 [05:22<07:30, 13.41it/s]

Epoch 3950: Loss = 0.7090
Epoch 3950: Loss = 0.6595
Epoch 3950: Loss = 0.6696
Epoch 3950: Loss = 0.7006
Epoch 3950: Loss = 0.6759


 40%|███▉      | 3962/10000 [05:23<08:19, 12.08it/s]

Epoch 3960: Loss = 0.6290
Epoch 3960: Loss = 0.6343
Epoch 3960: Loss = 0.6793
Epoch 3960: Loss = 0.6656
Epoch 3960: Loss = 0.6767


 40%|███▉      | 3972/10000 [05:23<07:51, 12.79it/s]

Epoch 3970: Loss = 0.6717
Epoch 3970: Loss = 0.6678
Epoch 3970: Loss = 0.6541
Epoch 3970: Loss = 0.6840
Epoch 3970: Loss = 0.6546


 40%|███▉      | 3982/10000 [05:24<07:48, 12.85it/s]

Epoch 3980: Loss = 0.6834
Epoch 3980: Loss = 0.6631
Epoch 3980: Loss = 0.6822
Epoch 3980: Loss = 0.6582
Epoch 3980: Loss = 0.6313


 40%|███▉      | 3992/10000 [05:25<07:36, 13.17it/s]

Epoch 3990: Loss = 0.6577
Epoch 3990: Loss = 0.6572
Epoch 3990: Loss = 0.6899
Epoch 3990: Loss = 0.6694
Epoch 3990: Loss = 0.6582


 40%|████      | 4002/10000 [05:26<07:10, 13.94it/s]

Epoch 4000: Loss = 0.6775
Epoch 4000: Loss = 0.6774
Epoch 4000: Loss = 0.6855
Epoch 4000: Loss = 0.6742
Epoch 4000: Loss = 0.6751


 40%|████      | 4012/10000 [05:26<07:58, 12.53it/s]

Epoch 4010: Loss = 0.6762
Epoch 4010: Loss = 0.7026
Epoch 4010: Loss = 0.6918
Epoch 4010: Loss = 0.6682
Epoch 4010: Loss = 0.6665


 40%|████      | 4022/10000 [05:27<07:21, 13.56it/s]

Epoch 4020: Loss = 0.6845
Epoch 4020: Loss = 0.6641
Epoch 4020: Loss = 0.6677
Epoch 4020: Loss = 0.6391
Epoch 4020: Loss = 0.6803


 40%|████      | 4032/10000 [05:28<07:13, 13.78it/s]

Epoch 4030: Loss = 0.6756
Epoch 4030: Loss = 0.6829
Epoch 4030: Loss = 0.6405
Epoch 4030: Loss = 0.6810
Epoch 4030: Loss = 0.6321


 40%|████      | 4042/10000 [05:29<06:59, 14.19it/s]

Epoch 4040: Loss = 0.6712
Epoch 4040: Loss = 0.6651
Epoch 4040: Loss = 0.6683
Epoch 4040: Loss = 0.6835
Epoch 4040: Loss = 0.6412


 41%|████      | 4052/10000 [05:29<07:38, 12.98it/s]

Epoch 4050: Loss = 0.6617
Epoch 4050: Loss = 0.6479
Epoch 4050: Loss = 0.6932
Epoch 4050: Loss = 0.6468
Epoch 4050: Loss = 0.6418


 41%|████      | 4062/10000 [05:30<07:16, 13.60it/s]

Epoch 4060: Loss = 0.6929
Epoch 4060: Loss = 0.6622
Epoch 4060: Loss = 0.6606
Epoch 4060: Loss = 0.6977
Epoch 4060: Loss = 0.6685


 41%|████      | 4072/10000 [05:31<07:02, 14.03it/s]

Epoch 4070: Loss = 0.6841
Epoch 4070: Loss = 0.6702
Epoch 4070: Loss = 0.7035
Epoch 4070: Loss = 0.6905
Epoch 4070: Loss = 0.6317


 41%|████      | 4082/10000 [05:32<07:08, 13.81it/s]

Epoch 4080: Loss = 0.6316
Epoch 4080: Loss = 0.6519
Epoch 4080: Loss = 0.7102
Epoch 4080: Loss = 0.6956
Epoch 4080: Loss = 0.6500


 41%|████      | 4092/10000 [05:32<07:08, 13.79it/s]

Epoch 4090: Loss = 0.6699
Epoch 4090: Loss = 0.6637
Epoch 4090: Loss = 0.7034
Epoch 4090: Loss = 0.6782
Epoch 4090: Loss = 0.6842


 41%|████      | 4102/10000 [05:33<07:01, 14.00it/s]

Epoch 4100: Loss = 0.6636
Epoch 4100: Loss = 0.6937
Epoch 4100: Loss = 0.6495
Epoch 4100: Loss = 0.6881
Epoch 4100: Loss = 0.6404


 41%|████      | 4112/10000 [05:34<07:47, 12.59it/s]

Epoch 4110: Loss = 0.6880
Epoch 4110: Loss = 0.6633
Epoch 4110: Loss = 0.6637
Epoch 4110: Loss = 0.6645
Epoch 4110: Loss = 0.6755


 41%|████      | 4122/10000 [05:35<08:45, 11.20it/s]

Epoch 4120: Loss = 0.6707
Epoch 4120: Loss = 0.6387
Epoch 4120: Loss = 0.6735
Epoch 4120: Loss = 0.6552
Epoch 4120: Loss = 0.6823


 41%|████▏     | 4132/10000 [05:36<08:15, 11.84it/s]

Epoch 4130: Loss = 0.6697
Epoch 4130: Loss = 0.6656
Epoch 4130: Loss = 0.6701
Epoch 4130: Loss = 0.6734
Epoch 4130: Loss = 0.6964


 41%|████▏     | 4142/10000 [05:37<07:46, 12.55it/s]

Epoch 4140: Loss = 0.6397
Epoch 4140: Loss = 0.6569
Epoch 4140: Loss = 0.6429
Epoch 4140: Loss = 0.6510
Epoch 4140: Loss = 0.6909


 42%|████▏     | 4152/10000 [05:37<07:06, 13.72it/s]

Epoch 4150: Loss = 0.6402
Epoch 4150: Loss = 0.6825
Epoch 4150: Loss = 0.6920
Epoch 4150: Loss = 0.7117
Epoch 4150: Loss = 0.6356


 42%|████▏     | 4162/10000 [05:38<07:07, 13.66it/s]

Epoch 4160: Loss = 0.6498
Epoch 4160: Loss = 0.7008
Epoch 4160: Loss = 0.6820
Epoch 4160: Loss = 0.6377
Epoch 4160: Loss = 0.6902


 42%|████▏     | 4172/10000 [05:39<07:36, 12.76it/s]

Epoch 4170: Loss = 0.6639
Epoch 4170: Loss = 0.6959
Epoch 4170: Loss = 0.6804
Epoch 4170: Loss = 0.6781
Epoch 4170: Loss = 0.6836


 42%|████▏     | 4182/10000 [05:40<08:10, 11.87it/s]

Epoch 4180: Loss = 0.6572
Epoch 4180: Loss = 0.6757
Epoch 4180: Loss = 0.7014
Epoch 4180: Loss = 0.6643
Epoch 4180: Loss = 0.6397


 42%|████▏     | 4192/10000 [05:40<07:44, 12.49it/s]

Epoch 4190: Loss = 0.6653
Epoch 4190: Loss = 0.6678
Epoch 4190: Loss = 0.6885
Epoch 4190: Loss = 0.6768
Epoch 4190: Loss = 0.6807


 42%|████▏     | 4202/10000 [05:41<07:05, 13.64it/s]

Epoch 4200: Loss = 0.6599
Epoch 4200: Loss = 0.6792
Epoch 4200: Loss = 0.6847
Epoch 4200: Loss = 0.6531
Epoch 4200: Loss = 0.7086


 42%|████▏     | 4212/10000 [05:42<07:20, 13.13it/s]

Epoch 4210: Loss = 0.6684
Epoch 4210: Loss = 0.6798
Epoch 4210: Loss = 0.6515
Epoch 4210: Loss = 0.6752
Epoch 4210: Loss = 0.6576


 42%|████▏     | 4222/10000 [05:43<07:13, 13.34it/s]

Epoch 4220: Loss = 0.6612
Epoch 4220: Loss = 0.6534
Epoch 4220: Loss = 0.6971
Epoch 4220: Loss = 0.6465
Epoch 4220: Loss = 0.6549


 42%|████▏     | 4232/10000 [05:43<06:57, 13.82it/s]

Epoch 4230: Loss = 0.6599
Epoch 4230: Loss = 0.6886
Epoch 4230: Loss = 0.6659
Epoch 4230: Loss = 0.6917
Epoch 4230: Loss = 0.6400


 42%|████▏     | 4242/10000 [05:44<07:16, 13.20it/s]

Epoch 4240: Loss = 0.6817
Epoch 4240: Loss = 0.6568
Epoch 4240: Loss = 0.6654
Epoch 4240: Loss = 0.6720
Epoch 4240: Loss = 0.6937


 43%|████▎     | 4252/10000 [05:45<07:37, 12.57it/s]

Epoch 4250: Loss = 0.6671
Epoch 4250: Loss = 0.6797
Epoch 4250: Loss = 0.6871
Epoch 4250: Loss = 0.6414
Epoch 4250: Loss = 0.6944


 43%|████▎     | 4262/10000 [05:46<08:21, 11.44it/s]

Epoch 4260: Loss = 0.6599
Epoch 4260: Loss = 0.6722
Epoch 4260: Loss = 0.6991
Epoch 4260: Loss = 0.6402
Epoch 4260: Loss = 0.6627


 43%|████▎     | 4272/10000 [05:47<07:14, 13.17it/s]

Epoch 4270: Loss = 0.6393
Epoch 4270: Loss = 0.6876
Epoch 4270: Loss = 0.6678
Epoch 4270: Loss = 0.6995
Epoch 4270: Loss = 0.6766


 43%|████▎     | 4282/10000 [05:47<07:14, 13.17it/s]

Epoch 4280: Loss = 0.6572
Epoch 4280: Loss = 0.6776
Epoch 4280: Loss = 0.6795
Epoch 4280: Loss = 0.6739
Epoch 4280: Loss = 0.6802


 43%|████▎     | 4292/10000 [05:48<06:58, 13.65it/s]

Epoch 4290: Loss = 0.6869
Epoch 4290: Loss = 0.6568
Epoch 4290: Loss = 0.6687
Epoch 4290: Loss = 0.6689
Epoch 4290: Loss = 0.6638


 43%|████▎     | 4302/10000 [05:49<06:45, 14.04it/s]

Epoch 4300: Loss = 0.6508
Epoch 4300: Loss = 0.6739
Epoch 4300: Loss = 0.6845
Epoch 4300: Loss = 0.6974
Epoch 4300: Loss = 0.6642


 43%|████▎     | 4312/10000 [05:50<06:46, 14.00it/s]

Epoch 4310: Loss = 0.6325
Epoch 4310: Loss = 0.6388
Epoch 4310: Loss = 0.6724
Epoch 4310: Loss = 0.6580
Epoch 4310: Loss = 0.6318


 43%|████▎     | 4322/10000 [05:51<08:29, 11.14it/s]

Epoch 4320: Loss = 0.6815
Epoch 4320: Loss = 0.6556
Epoch 4320: Loss = 0.6738
Epoch 4320: Loss = 0.6914
Epoch 4320: Loss = 0.6514


 43%|████▎     | 4332/10000 [05:51<07:00, 13.48it/s]

Epoch 4330: Loss = 0.6767
Epoch 4330: Loss = 0.6981
Epoch 4330: Loss = 0.6580
Epoch 4330: Loss = 0.6419
Epoch 4330: Loss = 0.6706


 43%|████▎     | 4342/10000 [05:52<06:48, 13.87it/s]

Epoch 4340: Loss = 0.6772
Epoch 4340: Loss = 0.6604
Epoch 4340: Loss = 0.6816
Epoch 4340: Loss = 0.6774
Epoch 4340: Loss = 0.6676


 44%|████▎     | 4352/10000 [05:53<06:41, 14.07it/s]

Epoch 4350: Loss = 0.6575
Epoch 4350: Loss = 0.6465
Epoch 4350: Loss = 0.6858
Epoch 4350: Loss = 0.6503
Epoch 4350: Loss = 0.6572


 44%|████▎     | 4362/10000 [05:53<06:45, 13.91it/s]

Epoch 4360: Loss = 0.6699
Epoch 4360: Loss = 0.6907
Epoch 4360: Loss = 0.6732
Epoch 4360: Loss = 0.6803
Epoch 4360: Loss = 0.6664


 44%|████▎     | 4372/10000 [05:54<07:45, 12.09it/s]

Epoch 4370: Loss = 0.6679
Epoch 4370: Loss = 0.6478
Epoch 4370: Loss = 0.6946
Epoch 4370: Loss = 0.6692
Epoch 4370: Loss = 0.6437


 44%|████▍     | 4382/10000 [05:55<06:49, 13.72it/s]

Epoch 4380: Loss = 0.6654
Epoch 4380: Loss = 0.6748
Epoch 4380: Loss = 0.6837
Epoch 4380: Loss = 0.6837
Epoch 4380: Loss = 0.6671


 44%|████▍     | 4392/10000 [05:56<07:45, 12.04it/s]

Epoch 4390: Loss = 0.6882
Epoch 4390: Loss = 0.6828
Epoch 4390: Loss = 0.6662
Epoch 4390: Loss = 0.6851
Epoch 4390: Loss = 0.6464


 44%|████▍     | 4402/10000 [05:57<06:47, 13.73it/s]

Epoch 4400: Loss = 0.6714
Epoch 4400: Loss = 0.6691
Epoch 4400: Loss = 0.6843
Epoch 4400: Loss = 0.6752
Epoch 4400: Loss = 0.6847


 44%|████▍     | 4412/10000 [05:57<08:15, 11.29it/s]

Epoch 4410: Loss = 0.6526
Epoch 4410: Loss = 0.6531
Epoch 4410: Loss = 0.6794
Epoch 4410: Loss = 0.6751
Epoch 4410: Loss = 0.6598


 44%|████▍     | 4422/10000 [05:58<07:17, 12.75it/s]

Epoch 4420: Loss = 0.6777
Epoch 4420: Loss = 0.6847
Epoch 4420: Loss = 0.6534
Epoch 4420: Loss = 0.6650
Epoch 4420: Loss = 0.6421


 44%|████▍     | 4432/10000 [05:59<07:10, 12.94it/s]

Epoch 4430: Loss = 0.6864
Epoch 4430: Loss = 0.6897
Epoch 4430: Loss = 0.6887
Epoch 4430: Loss = 0.6955
Epoch 4430: Loss = 0.6739


 44%|████▍     | 4442/10000 [06:00<06:42, 13.81it/s]

Epoch 4440: Loss = 0.6573
Epoch 4440: Loss = 0.6982
Epoch 4440: Loss = 0.6632
Epoch 4440: Loss = 0.6712
Epoch 4440: Loss = 0.6842


 45%|████▍     | 4452/10000 [06:00<06:42, 13.79it/s]

Epoch 4450: Loss = 0.6583
Epoch 4450: Loss = 0.6599
Epoch 4450: Loss = 0.7015
Epoch 4450: Loss = 0.6556
Epoch 4450: Loss = 0.6921


 45%|████▍     | 4462/10000 [06:01<06:48, 13.55it/s]

Epoch 4460: Loss = 0.6617
Epoch 4460: Loss = 0.6473
Epoch 4460: Loss = 0.6830
Epoch 4460: Loss = 0.6916
Epoch 4460: Loss = 0.6425


 45%|████▍     | 4472/10000 [06:02<06:57, 13.24it/s]

Epoch 4470: Loss = 0.6626
Epoch 4470: Loss = 0.6617
Epoch 4470: Loss = 0.6679
Epoch 4470: Loss = 0.7067
Epoch 4470: Loss = 0.6548


 45%|████▍     | 4482/10000 [06:03<07:03, 13.02it/s]

Epoch 4480: Loss = 0.7005
Epoch 4480: Loss = 0.6729
Epoch 4480: Loss = 0.6566
Epoch 4480: Loss = 0.6604
Epoch 4480: Loss = 0.6730


 45%|████▍     | 4492/10000 [06:04<06:45, 13.57it/s]

Epoch 4490: Loss = 0.6623
Epoch 4490: Loss = 0.6432
Epoch 4490: Loss = 0.6890
Epoch 4490: Loss = 0.6901
Epoch 4490: Loss = 0.6333


 45%|████▌     | 4502/10000 [06:04<06:30, 14.07it/s]

Epoch 4500: Loss = 0.6670
Epoch 4500: Loss = 0.6609
Epoch 4500: Loss = 0.6456
Epoch 4500: Loss = 0.6583
Epoch 4500: Loss = 0.6612


 45%|████▌     | 4512/10000 [06:05<07:11, 12.71it/s]

Epoch 4510: Loss = 0.6454
Epoch 4510: Loss = 0.7091
Epoch 4510: Loss = 0.6663
Epoch 4510: Loss = 0.6465
Epoch 4510: Loss = 0.6670


 45%|████▌     | 4522/10000 [06:06<06:50, 13.36it/s]

Epoch 4520: Loss = 0.6672
Epoch 4520: Loss = 0.6831
Epoch 4520: Loss = 0.6774
Epoch 4520: Loss = 0.6654
Epoch 4520: Loss = 0.6341


 45%|████▌     | 4532/10000 [06:07<07:07, 12.78it/s]

Epoch 4530: Loss = 0.6576
Epoch 4530: Loss = 0.6870
Epoch 4530: Loss = 0.6890
Epoch 4530: Loss = 0.6949
Epoch 4530: Loss = 0.7009


 45%|████▌     | 4542/10000 [06:07<07:05, 12.84it/s]

Epoch 4540: Loss = 0.6652
Epoch 4540: Loss = 0.6632
Epoch 4540: Loss = 0.6623
Epoch 4540: Loss = 0.6730
Epoch 4540: Loss = 0.6986


 46%|████▌     | 4552/10000 [06:08<08:23, 10.82it/s]

Epoch 4550: Loss = 0.6811
Epoch 4550: Loss = 0.6860
Epoch 4550: Loss = 0.6840
Epoch 4550: Loss = 0.6666
Epoch 4550: Loss = 0.7115


 46%|████▌     | 4562/10000 [06:09<06:57, 13.03it/s]

Epoch 4560: Loss = 0.6707
Epoch 4560: Loss = 0.7020
Epoch 4560: Loss = 0.6422
Epoch 4560: Loss = 0.6797
Epoch 4560: Loss = 0.6729


 46%|████▌     | 4572/10000 [06:10<06:34, 13.75it/s]

Epoch 4570: Loss = 0.6493
Epoch 4570: Loss = 0.6856
Epoch 4570: Loss = 0.6834
Epoch 4570: Loss = 0.6711
Epoch 4570: Loss = 0.6645


 46%|████▌     | 4582/10000 [06:11<06:57, 12.97it/s]

Epoch 4580: Loss = 0.6775
Epoch 4580: Loss = 0.6425
Epoch 4580: Loss = 0.6547
Epoch 4580: Loss = 0.6334
Epoch 4580: Loss = 0.6786


 46%|████▌     | 4592/10000 [06:11<06:30, 13.85it/s]

Epoch 4590: Loss = 0.6789
Epoch 4590: Loss = 0.6760
Epoch 4590: Loss = 0.7004
Epoch 4590: Loss = 0.6793
Epoch 4590: Loss = 0.7121


 46%|████▌     | 4602/10000 [06:12<06:51, 13.11it/s]

Epoch 4600: Loss = 0.6667
Epoch 4600: Loss = 0.6729
Epoch 4600: Loss = 0.6568
Epoch 4600: Loss = 0.6615
Epoch 4600: Loss = 0.6578


 46%|████▌     | 4612/10000 [06:13<06:31, 13.75it/s]

Epoch 4610: Loss = 0.6783
Epoch 4610: Loss = 0.7001
Epoch 4610: Loss = 0.7039
Epoch 4610: Loss = 0.7031
Epoch 4610: Loss = 0.6264


 46%|████▌     | 4622/10000 [06:14<06:20, 14.15it/s]

Epoch 4620: Loss = 0.6656
Epoch 4620: Loss = 0.6345
Epoch 4620: Loss = 0.6943
Epoch 4620: Loss = 0.6984
Epoch 4620: Loss = 0.6173


 46%|████▋     | 4632/10000 [06:14<06:40, 13.39it/s]

Epoch 4630: Loss = 0.6831
Epoch 4630: Loss = 0.6714
Epoch 4630: Loss = 0.6793
Epoch 4630: Loss = 0.6524
Epoch 4630: Loss = 0.6645


 46%|████▋     | 4642/10000 [06:15<06:21, 14.06it/s]

Epoch 4640: Loss = 0.6750
Epoch 4640: Loss = 0.6776
Epoch 4640: Loss = 0.7150
Epoch 4640: Loss = 0.6591
Epoch 4640: Loss = 0.6260


 47%|████▋     | 4652/10000 [06:16<06:32, 13.64it/s]

Epoch 4650: Loss = 0.6605
Epoch 4650: Loss = 0.6915
Epoch 4650: Loss = 0.6659
Epoch 4650: Loss = 0.6861
Epoch 4650: Loss = 0.6844


 47%|████▋     | 4662/10000 [06:17<06:43, 13.23it/s]

Epoch 4660: Loss = 0.6710
Epoch 4660: Loss = 0.6526
Epoch 4660: Loss = 0.6588
Epoch 4660: Loss = 0.6689
Epoch 4660: Loss = 0.7009


 47%|████▋     | 4672/10000 [06:17<06:46, 13.11it/s]

Epoch 4670: Loss = 0.6652
Epoch 4670: Loss = 0.6530
Epoch 4670: Loss = 0.6635
Epoch 4670: Loss = 0.6838
Epoch 4670: Loss = 0.6736


 47%|████▋     | 4682/10000 [06:18<06:22, 13.89it/s]

Epoch 4680: Loss = 0.6768
Epoch 4680: Loss = 0.6579
Epoch 4680: Loss = 0.6646
Epoch 4680: Loss = 0.6433
Epoch 4680: Loss = 0.6882


 47%|████▋     | 4692/10000 [06:19<06:15, 14.14it/s]

Epoch 4690: Loss = 0.6636
Epoch 4690: Loss = 0.6741
Epoch 4690: Loss = 0.6773
Epoch 4690: Loss = 0.6842
Epoch 4690: Loss = 0.6637


 47%|████▋     | 4702/10000 [06:19<06:15, 14.11it/s]

Epoch 4700: Loss = 0.6667
Epoch 4700: Loss = 0.6703
Epoch 4700: Loss = 0.6946
Epoch 4700: Loss = 0.6566
Epoch 4700: Loss = 0.6495


 47%|████▋     | 4712/10000 [06:20<07:02, 12.53it/s]

Epoch 4710: Loss = 0.6577
Epoch 4710: Loss = 0.6685
Epoch 4710: Loss = 0.7111
Epoch 4710: Loss = 0.6961
Epoch 4710: Loss = 0.6857


 47%|████▋     | 4722/10000 [06:21<06:40, 13.18it/s]

Epoch 4720: Loss = 0.6516
Epoch 4720: Loss = 0.6524
Epoch 4720: Loss = 0.6902
Epoch 4720: Loss = 0.6796
Epoch 4720: Loss = 0.6496


 47%|████▋     | 4732/10000 [06:22<07:23, 11.89it/s]

Epoch 4730: Loss = 0.6735
Epoch 4730: Loss = 0.6860
Epoch 4730: Loss = 0.6976
Epoch 4730: Loss = 0.6594
Epoch 4730: Loss = 0.6637


 47%|████▋     | 4742/10000 [06:23<06:27, 13.56it/s]

Epoch 4740: Loss = 0.6583
Epoch 4740: Loss = 0.6565
Epoch 4740: Loss = 0.6708
Epoch 4740: Loss = 0.6750
Epoch 4740: Loss = 0.6881


 48%|████▊     | 4752/10000 [06:23<06:32, 13.38it/s]

Epoch 4750: Loss = 0.6336
Epoch 4750: Loss = 0.6674
Epoch 4750: Loss = 0.6679
Epoch 4750: Loss = 0.6438
Epoch 4750: Loss = 0.6451


 48%|████▊     | 4762/10000 [06:24<06:48, 12.84it/s]

Epoch 4760: Loss = 0.6117
Epoch 4760: Loss = 0.6453
Epoch 4760: Loss = 0.6595
Epoch 4760: Loss = 0.6847
Epoch 4760: Loss = 0.6604


 48%|████▊     | 4772/10000 [06:25<06:22, 13.66it/s]

Epoch 4770: Loss = 0.7037
Epoch 4770: Loss = 0.6629
Epoch 4770: Loss = 0.6637
Epoch 4770: Loss = 0.6577
Epoch 4770: Loss = 0.6806


 48%|████▊     | 4782/10000 [06:26<06:12, 14.03it/s]

Epoch 4780: Loss = 0.6592
Epoch 4780: Loss = 0.6749
Epoch 4780: Loss = 0.6413
Epoch 4780: Loss = 0.7031
Epoch 4780: Loss = 0.7269


 48%|████▊     | 4792/10000 [06:26<06:15, 13.85it/s]

Epoch 4790: Loss = 0.6595
Epoch 4790: Loss = 0.6680
Epoch 4790: Loss = 0.6533
Epoch 4790: Loss = 0.6919
Epoch 4790: Loss = 0.6911


 48%|████▊     | 4802/10000 [06:27<06:22, 13.58it/s]

Epoch 4800: Loss = 0.6739
Epoch 4800: Loss = 0.6961
Epoch 4800: Loss = 0.6766
Epoch 4800: Loss = 0.6624
Epoch 4800: Loss = 0.6515


 48%|████▊     | 4812/10000 [06:28<06:29, 13.34it/s]

Epoch 4810: Loss = 0.6873
Epoch 4810: Loss = 0.7045
Epoch 4810: Loss = 0.6821
Epoch 4810: Loss = 0.6327
Epoch 4810: Loss = 0.6874


 48%|████▊     | 4822/10000 [06:29<06:38, 13.00it/s]

Epoch 4820: Loss = 0.6650
Epoch 4820: Loss = 0.6850
Epoch 4820: Loss = 0.6510
Epoch 4820: Loss = 0.6903
Epoch 4820: Loss = 0.6531


 48%|████▊     | 4832/10000 [06:29<06:17, 13.68it/s]

Epoch 4830: Loss = 0.6460
Epoch 4830: Loss = 0.6984
Epoch 4830: Loss = 0.6338
Epoch 4830: Loss = 0.6936
Epoch 4830: Loss = 0.6623


 48%|████▊     | 4842/10000 [06:30<06:37, 12.98it/s]

Epoch 4840: Loss = 0.6646
Epoch 4840: Loss = 0.6671
Epoch 4840: Loss = 0.6938
Epoch 4840: Loss = 0.6545
Epoch 4840: Loss = 0.6670


 49%|████▊     | 4852/10000 [06:31<06:15, 13.72it/s]

Epoch 4850: Loss = 0.6854
Epoch 4850: Loss = 0.6758
Epoch 4850: Loss = 0.6975
Epoch 4850: Loss = 0.6658
Epoch 4850: Loss = 0.6546


 49%|████▊     | 4862/10000 [06:32<06:05, 14.04it/s]

Epoch 4860: Loss = 0.6682
Epoch 4860: Loss = 0.6988
Epoch 4860: Loss = 0.6502
Epoch 4860: Loss = 0.6759
Epoch 4860: Loss = 0.6559


 49%|████▊     | 4872/10000 [06:32<06:40, 12.80it/s]

Epoch 4870: Loss = 0.6779
Epoch 4870: Loss = 0.6771
Epoch 4870: Loss = 0.6487
Epoch 4870: Loss = 0.6806
Epoch 4870: Loss = 0.6492


 49%|████▉     | 4882/10000 [06:33<07:03, 12.08it/s]

Epoch 4880: Loss = 0.6763
Epoch 4880: Loss = 0.6723
Epoch 4880: Loss = 0.6567
Epoch 4880: Loss = 0.7108
Epoch 4880: Loss = 0.6539


 49%|████▉     | 4892/10000 [06:34<06:58, 12.21it/s]

Epoch 4890: Loss = 0.6736
Epoch 4890: Loss = 0.6325
Epoch 4890: Loss = 0.6582
Epoch 4890: Loss = 0.6631
Epoch 4890: Loss = 0.6512


 49%|████▉     | 4902/10000 [06:35<06:39, 12.77it/s]

Epoch 4900: Loss = 0.6478
Epoch 4900: Loss = 0.6501
Epoch 4900: Loss = 0.6311
Epoch 4900: Loss = 0.6841
Epoch 4900: Loss = 0.6493


 49%|████▉     | 4912/10000 [06:36<06:56, 12.22it/s]

Epoch 4910: Loss = 0.6441
Epoch 4910: Loss = 0.6476
Epoch 4910: Loss = 0.6763
Epoch 4910: Loss = 0.6722
Epoch 4910: Loss = 0.6244


 49%|████▉     | 4922/10000 [06:36<06:26, 13.14it/s]

Epoch 4920: Loss = 0.6381
Epoch 4920: Loss = 0.6404
Epoch 4920: Loss = 0.6290
Epoch 4920: Loss = 0.6764
Epoch 4920: Loss = 0.6679


 49%|████▉     | 4932/10000 [06:37<06:25, 13.14it/s]

Epoch 4930: Loss = 0.6612
Epoch 4930: Loss = 0.6742
Epoch 4930: Loss = 0.6818
Epoch 4930: Loss = 0.6433
Epoch 4930: Loss = 0.6927


 49%|████▉     | 4942/10000 [06:38<07:20, 11.49it/s]

Epoch 4940: Loss = 0.6853
Epoch 4940: Loss = 0.6685
Epoch 4940: Loss = 0.6706
Epoch 4940: Loss = 0.6482
Epoch 4940: Loss = 0.6818


 50%|████▉     | 4952/10000 [06:39<07:22, 11.41it/s]

Epoch 4950: Loss = 0.6844
Epoch 4950: Loss = 0.6691
Epoch 4950: Loss = 0.6465
Epoch 4950: Loss = 0.6650
Epoch 4950: Loss = 0.6670


 50%|████▉     | 4962/10000 [06:40<06:28, 12.97it/s]

Epoch 4960: Loss = 0.6694
Epoch 4960: Loss = 0.6862
Epoch 4960: Loss = 0.6696
Epoch 4960: Loss = 0.6622
Epoch 4960: Loss = 0.6648


 50%|████▉     | 4972/10000 [06:40<06:41, 12.52it/s]

Epoch 4970: Loss = 0.6644
Epoch 4970: Loss = 0.6499
Epoch 4970: Loss = 0.6750
Epoch 4970: Loss = 0.6800
Epoch 4970: Loss = 0.6525


 50%|████▉     | 4982/10000 [06:41<07:01, 11.90it/s]

Epoch 4980: Loss = 0.7150
Epoch 4980: Loss = 0.6432
Epoch 4980: Loss = 0.6728
Epoch 4980: Loss = 0.6738
Epoch 4980: Loss = 0.6556


 50%|████▉     | 4992/10000 [06:42<06:13, 13.39it/s]

Epoch 4990: Loss = 0.6697
Epoch 4990: Loss = 0.6984
Epoch 4990: Loss = 0.6774
Epoch 4990: Loss = 0.6889
Epoch 4990: Loss = 0.6886


 50%|█████     | 5002/10000 [06:43<05:56, 14.01it/s]

Epoch 5000: Loss = 0.6589
Epoch 5000: Loss = 0.6513
Epoch 5000: Loss = 0.6985
Epoch 5000: Loss = 0.6642
Epoch 5000: Loss = 0.6795


 50%|█████     | 5012/10000 [06:44<06:05, 13.66it/s]

Epoch 5010: Loss = 0.6537
Epoch 5010: Loss = 0.6438
Epoch 5010: Loss = 0.6851
Epoch 5010: Loss = 0.6586
Epoch 5010: Loss = 0.6652


 50%|█████     | 5022/10000 [06:44<06:08, 13.50it/s]

Epoch 5020: Loss = 0.6853
Epoch 5020: Loss = 0.6732
Epoch 5020: Loss = 0.6601
Epoch 5020: Loss = 0.6835
Epoch 5020: Loss = 0.6517


 50%|█████     | 5032/10000 [06:45<06:18, 13.14it/s]

Epoch 5030: Loss = 0.6709
Epoch 5030: Loss = 0.6591
Epoch 5030: Loss = 0.6803
Epoch 5030: Loss = 0.6646
Epoch 5030: Loss = 0.6406


 50%|█████     | 5042/10000 [06:46<06:03, 13.64it/s]

Epoch 5040: Loss = 0.6670
Epoch 5040: Loss = 0.6527
Epoch 5040: Loss = 0.7048
Epoch 5040: Loss = 0.6541
Epoch 5040: Loss = 0.6775


 51%|█████     | 5052/10000 [06:46<05:53, 13.99it/s]

Epoch 5050: Loss = 0.6818
Epoch 5050: Loss = 0.6695
Epoch 5050: Loss = 0.6537
Epoch 5050: Loss = 0.6722
Epoch 5050: Loss = 0.6698


 51%|█████     | 5062/10000 [06:47<06:03, 13.60it/s]

Epoch 5060: Loss = 0.6926
Epoch 5060: Loss = 0.6756
Epoch 5060: Loss = 0.6713
Epoch 5060: Loss = 0.6857
Epoch 5060: Loss = 0.6544


 51%|█████     | 5072/10000 [06:48<06:10, 13.30it/s]

Epoch 5070: Loss = 0.6414
Epoch 5070: Loss = 0.6822
Epoch 5070: Loss = 0.6650
Epoch 5070: Loss = 0.6529
Epoch 5070: Loss = 0.6695


 51%|█████     | 5082/10000 [06:49<06:05, 13.45it/s]

Epoch 5080: Loss = 0.6379
Epoch 5080: Loss = 0.6798
Epoch 5080: Loss = 0.7028
Epoch 5080: Loss = 0.6466
Epoch 5080: Loss = 0.6929


 51%|█████     | 5092/10000 [06:50<05:53, 13.88it/s]

Epoch 5090: Loss = 0.6940
Epoch 5090: Loss = 0.6624
Epoch 5090: Loss = 0.6530
Epoch 5090: Loss = 0.6603
Epoch 5090: Loss = 0.6776


 51%|█████     | 5102/10000 [06:50<05:53, 13.87it/s]

Epoch 5100: Loss = 0.6973
Epoch 5100: Loss = 0.6883
Epoch 5100: Loss = 0.6784
Epoch 5100: Loss = 0.6686
Epoch 5100: Loss = 0.6515


 51%|█████     | 5112/10000 [06:51<06:21, 12.82it/s]

Epoch 5110: Loss = 0.6592
Epoch 5110: Loss = 0.6564
Epoch 5110: Loss = 0.6800
Epoch 5110: Loss = 0.6795
Epoch 5110: Loss = 0.6864


 51%|█████     | 5122/10000 [06:52<06:02, 13.45it/s]

Epoch 5120: Loss = 0.6909
Epoch 5120: Loss = 0.6603
Epoch 5120: Loss = 0.6836
Epoch 5120: Loss = 0.6589
Epoch 5120: Loss = 0.6603


 51%|█████▏    | 5132/10000 [06:53<06:50, 11.86it/s]

Epoch 5130: Loss = 0.6668
Epoch 5130: Loss = 0.6715
Epoch 5130: Loss = 0.6648
Epoch 5130: Loss = 0.6267
Epoch 5130: Loss = 0.6610


 51%|█████▏    | 5140/10000 [06:53<06:28, 12.52it/s]

Epoch 5140: Loss = 0.6633
Epoch 5140: Loss = 0.6772
Epoch 5140: Loss = 0.6710
Epoch 5140: Loss = 0.6435
Epoch 5140: Loss = 0.6531


 52%|█████▏    | 5152/10000 [06:54<06:58, 11.58it/s]

Epoch 5150: Loss = 0.6450
Epoch 5150: Loss = 0.7028
Epoch 5150: Loss = 0.6682
Epoch 5150: Loss = 0.6729
Epoch 5150: Loss = 0.6474


 52%|█████▏    | 5162/10000 [06:55<08:00, 10.07it/s]

Epoch 5160: Loss = 0.6961
Epoch 5160: Loss = 0.6562
Epoch 5160: Loss = 0.6436
Epoch 5160: Loss = 0.6487
Epoch 5160: Loss = 0.6892


 52%|█████▏    | 5172/10000 [06:56<06:28, 12.42it/s]

Epoch 5170: Loss = 0.6975
Epoch 5170: Loss = 0.6811
Epoch 5170: Loss = 0.6864
Epoch 5170: Loss = 0.7053
Epoch 5170: Loss = 0.6655


 52%|█████▏    | 5182/10000 [06:57<05:52, 13.67it/s]

Epoch 5180: Loss = 0.6328
Epoch 5180: Loss = 0.6536
Epoch 5180: Loss = 0.6740
Epoch 5180: Loss = 0.6561
Epoch 5180: Loss = 0.6628


 52%|█████▏    | 5192/10000 [06:58<05:40, 14.14it/s]

Epoch 5190: Loss = 0.6767
Epoch 5190: Loss = 0.6593
Epoch 5190: Loss = 0.6460
Epoch 5190: Loss = 0.6549
Epoch 5190: Loss = 0.6687


 52%|█████▏    | 5202/10000 [06:58<06:00, 13.29it/s]

Epoch 5200: Loss = 0.6889
Epoch 5200: Loss = 0.6328
Epoch 5200: Loss = 0.6812
Epoch 5200: Loss = 0.6656
Epoch 5200: Loss = 0.6428


 52%|█████▏    | 5212/10000 [06:59<05:42, 13.98it/s]

Epoch 5210: Loss = 0.6556
Epoch 5210: Loss = 0.6734
Epoch 5210: Loss = 0.6996
Epoch 5210: Loss = 0.6522
Epoch 5210: Loss = 0.6490


 52%|█████▏    | 5222/10000 [07:00<05:54, 13.49it/s]

Epoch 5220: Loss = 0.6812
Epoch 5220: Loss = 0.6344
Epoch 5220: Loss = 0.6792
Epoch 5220: Loss = 0.6417
Epoch 5220: Loss = 0.6902


 52%|█████▏    | 5232/10000 [07:01<05:51, 13.58it/s]

Epoch 5230: Loss = 0.6775
Epoch 5230: Loss = 0.6546
Epoch 5230: Loss = 0.6472
Epoch 5230: Loss = 0.6735
Epoch 5230: Loss = 0.6682


 52%|█████▏    | 5242/10000 [07:01<06:37, 11.96it/s]

Epoch 5240: Loss = 0.6952
Epoch 5240: Loss = 0.6868
Epoch 5240: Loss = 0.6807
Epoch 5240: Loss = 0.6566
Epoch 5240: Loss = 0.6648


 53%|█████▎    | 5252/10000 [07:02<06:17, 12.59it/s]

Epoch 5250: Loss = 0.6590
Epoch 5250: Loss = 0.6634
Epoch 5250: Loss = 0.6523
Epoch 5250: Loss = 0.6695
Epoch 5250: Loss = 0.6690


 53%|█████▎    | 5262/10000 [07:03<06:44, 11.72it/s]

Epoch 5260: Loss = 0.6792
Epoch 5260: Loss = 0.6940
Epoch 5260: Loss = 0.6568
Epoch 5260: Loss = 0.6751
Epoch 5260: Loss = 0.6605


 53%|█████▎    | 5272/10000 [07:04<06:10, 12.74it/s]

Epoch 5270: Loss = 0.6431
Epoch 5270: Loss = 0.6811
Epoch 5270: Loss = 0.6734
Epoch 5270: Loss = 0.6931
Epoch 5270: Loss = 0.6423


 53%|█████▎    | 5282/10000 [07:05<07:50, 10.03it/s]

Epoch 5280: Loss = 0.6760
Epoch 5280: Loss = 0.6929
Epoch 5280: Loss = 0.6418
Epoch 5280: Loss = 0.6788
Epoch 5280: Loss = 0.6474


 53%|█████▎    | 5292/10000 [07:06<06:19, 12.39it/s]

Epoch 5290: Loss = 0.6703
Epoch 5290: Loss = 0.6710
Epoch 5290: Loss = 0.6730
Epoch 5290: Loss = 0.6904
Epoch 5290: Loss = 0.6733


 53%|█████▎    | 5302/10000 [07:06<05:45, 13.61it/s]

Epoch 5300: Loss = 0.6430
Epoch 5300: Loss = 0.6666
Epoch 5300: Loss = 0.6590
Epoch 5300: Loss = 0.6421
Epoch 5300: Loss = 0.6766


 53%|█████▎    | 5312/10000 [07:07<05:55, 13.17it/s]

Epoch 5310: Loss = 0.6223
Epoch 5310: Loss = 0.6597
Epoch 5310: Loss = 0.6975
Epoch 5310: Loss = 0.6457
Epoch 5310: Loss = 0.6583


 53%|█████▎    | 5322/10000 [07:08<06:26, 12.09it/s]

Epoch 5320: Loss = 0.6489
Epoch 5320: Loss = 0.6662
Epoch 5320: Loss = 0.6714
Epoch 5320: Loss = 0.7000
Epoch 5320: Loss = 0.6544


 53%|█████▎    | 5332/10000 [07:09<06:25, 12.10it/s]

Epoch 5330: Loss = 0.6678
Epoch 5330: Loss = 0.6900
Epoch 5330: Loss = 0.6690
Epoch 5330: Loss = 0.6899
Epoch 5330: Loss = 0.6768


 53%|█████▎    | 5342/10000 [07:10<05:57, 13.01it/s]

Epoch 5340: Loss = 0.7024
Epoch 5340: Loss = 0.7049
Epoch 5340: Loss = 0.6719
Epoch 5340: Loss = 0.6588
Epoch 5340: Loss = 0.6623


 54%|█████▎    | 5352/10000 [07:11<06:31, 11.89it/s]

Epoch 5350: Loss = 0.6805
Epoch 5350: Loss = 0.6500
Epoch 5350: Loss = 0.6983
Epoch 5350: Loss = 0.6605
Epoch 5350: Loss = 0.6558


 54%|█████▎    | 5362/10000 [07:11<06:04, 12.73it/s]

Epoch 5360: Loss = 0.6907
Epoch 5360: Loss = 0.6636
Epoch 5360: Loss = 0.6769
Epoch 5360: Loss = 0.6621
Epoch 5360: Loss = 0.6920


 54%|█████▎    | 5372/10000 [07:12<05:51, 13.17it/s]

Epoch 5370: Loss = 0.6616
Epoch 5370: Loss = 0.6672
Epoch 5370: Loss = 0.6743
Epoch 5370: Loss = 0.6767
Epoch 5370: Loss = 0.6605


 54%|█████▍    | 5382/10000 [07:13<05:29, 14.03it/s]

Epoch 5380: Loss = 0.6806
Epoch 5380: Loss = 0.6800
Epoch 5380: Loss = 0.6642
Epoch 5380: Loss = 0.6771
Epoch 5380: Loss = 0.7001


 54%|█████▍    | 5392/10000 [07:13<05:30, 13.94it/s]

Epoch 5390: Loss = 0.6509
Epoch 5390: Loss = 0.6657
Epoch 5390: Loss = 0.6644
Epoch 5390: Loss = 0.6718
Epoch 5390: Loss = 0.6602


 54%|█████▍    | 5402/10000 [07:14<05:57, 12.86it/s]

Epoch 5400: Loss = 0.6705
Epoch 5400: Loss = 0.6904
Epoch 5400: Loss = 0.6993
Epoch 5400: Loss = 0.6412
Epoch 5400: Loss = 0.6820


 54%|█████▍    | 5412/10000 [07:15<05:36, 13.63it/s]

Epoch 5410: Loss = 0.6543
Epoch 5410: Loss = 0.7163
Epoch 5410: Loss = 0.6640
Epoch 5410: Loss = 0.6344
Epoch 5410: Loss = 0.6597


 54%|█████▍    | 5422/10000 [07:16<05:41, 13.39it/s]

Epoch 5420: Loss = 0.6392
Epoch 5420: Loss = 0.6643
Epoch 5420: Loss = 0.6802
Epoch 5420: Loss = 0.6784
Epoch 5420: Loss = 0.6421


 54%|█████▍    | 5432/10000 [07:16<05:26, 13.99it/s]

Epoch 5430: Loss = 0.6730
Epoch 5430: Loss = 0.6942
Epoch 5430: Loss = 0.7040
Epoch 5430: Loss = 0.6566
Epoch 5430: Loss = 0.6437


 54%|█████▍    | 5442/10000 [07:17<05:19, 14.25it/s]

Epoch 5440: Loss = 0.6670
Epoch 5440: Loss = 0.6571
Epoch 5440: Loss = 0.6784
Epoch 5440: Loss = 0.6513
Epoch 5440: Loss = 0.6735


 55%|█████▍    | 5452/10000 [07:18<05:25, 13.96it/s]

Epoch 5450: Loss = 0.6761
Epoch 5450: Loss = 0.6771
Epoch 5450: Loss = 0.6887
Epoch 5450: Loss = 0.6617
Epoch 5450: Loss = 0.6725


 55%|█████▍    | 5462/10000 [07:19<05:28, 13.82it/s]

Epoch 5460: Loss = 0.6493
Epoch 5460: Loss = 0.6726
Epoch 5460: Loss = 0.6622
Epoch 5460: Loss = 0.6483
Epoch 5460: Loss = 0.6523


 55%|█████▍    | 5472/10000 [07:19<06:00, 12.57it/s]

Epoch 5470: Loss = 0.6687
Epoch 5470: Loss = 0.6626
Epoch 5470: Loss = 0.6606
Epoch 5470: Loss = 0.6696
Epoch 5470: Loss = 0.6684


 55%|█████▍    | 5482/10000 [07:20<05:36, 13.42it/s]

Epoch 5480: Loss = 0.6926
Epoch 5480: Loss = 0.6634
Epoch 5480: Loss = 0.6420
Epoch 5480: Loss = 0.6739
Epoch 5480: Loss = 0.6684


 55%|█████▍    | 5492/10000 [07:21<05:49, 12.90it/s]

Epoch 5490: Loss = 0.6832
Epoch 5490: Loss = 0.6396
Epoch 5490: Loss = 0.6786
Epoch 5490: Loss = 0.6891
Epoch 5490: Loss = 0.6618


 55%|█████▌    | 5502/10000 [07:22<05:40, 13.22it/s]

Epoch 5500: Loss = 0.6394
Epoch 5500: Loss = 0.6595
Epoch 5500: Loss = 0.7035
Epoch 5500: Loss = 0.6657
Epoch 5500: Loss = 0.6738


 55%|█████▌    | 5512/10000 [07:22<05:21, 13.98it/s]

Epoch 5510: Loss = 0.6320
Epoch 5510: Loss = 0.6528
Epoch 5510: Loss = 0.6713
Epoch 5510: Loss = 0.6525
Epoch 5510: Loss = 0.6551


 55%|█████▌    | 5522/10000 [07:23<05:12, 14.34it/s]

Epoch 5520: Loss = 0.6748
Epoch 5520: Loss = 0.6545
Epoch 5520: Loss = 0.6826
Epoch 5520: Loss = 0.6847
Epoch 5520: Loss = 0.6496


 55%|█████▌    | 5532/10000 [07:24<05:18, 14.04it/s]

Epoch 5530: Loss = 0.6702
Epoch 5530: Loss = 0.6689
Epoch 5530: Loss = 0.6426
Epoch 5530: Loss = 0.6636
Epoch 5530: Loss = 0.6480


 55%|█████▌    | 5542/10000 [07:25<05:53, 12.63it/s]

Epoch 5540: Loss = 0.6688
Epoch 5540: Loss = 0.6654
Epoch 5540: Loss = 0.6645
Epoch 5540: Loss = 0.6669
Epoch 5540: Loss = 0.6923


 56%|█████▌    | 5552/10000 [07:25<05:21, 13.85it/s]

Epoch 5550: Loss = 0.6543
Epoch 5550: Loss = 0.6687
Epoch 5550: Loss = 0.6929
Epoch 5550: Loss = 0.6710
Epoch 5550: Loss = 0.6337


 56%|█████▌    | 5562/10000 [07:26<05:51, 12.61it/s]

Epoch 5560: Loss = 0.6791
Epoch 5560: Loss = 0.6865
Epoch 5560: Loss = 0.6726
Epoch 5560: Loss = 0.6348
Epoch 5560: Loss = 0.7078


 56%|█████▌    | 5572/10000 [07:27<05:21, 13.76it/s]

Epoch 5570: Loss = 0.6647
Epoch 5570: Loss = 0.6658
Epoch 5570: Loss = 0.6522
Epoch 5570: Loss = 0.6593
Epoch 5570: Loss = 0.6669


 56%|█████▌    | 5582/10000 [07:28<05:26, 13.54it/s]

Epoch 5580: Loss = 0.7033
Epoch 5580: Loss = 0.6127
Epoch 5580: Loss = 0.6645
Epoch 5580: Loss = 0.6783
Epoch 5580: Loss = 0.6773


 56%|█████▌    | 5592/10000 [07:29<05:27, 13.48it/s]

Epoch 5590: Loss = 0.6805
Epoch 5590: Loss = 0.6640
Epoch 5590: Loss = 0.6419
Epoch 5590: Loss = 0.6679
Epoch 5590: Loss = 0.6874


 56%|█████▌    | 5602/10000 [07:29<05:14, 13.97it/s]

Epoch 5600: Loss = 0.6735
Epoch 5600: Loss = 0.6587
Epoch 5600: Loss = 0.6730
Epoch 5600: Loss = 0.6931
Epoch 5600: Loss = 0.6729


 56%|█████▌    | 5612/10000 [07:30<05:08, 14.22it/s]

Epoch 5610: Loss = 0.6396
Epoch 5610: Loss = 0.7024
Epoch 5610: Loss = 0.6898
Epoch 5610: Loss = 0.6647
Epoch 5610: Loss = 0.6898


 56%|█████▌    | 5622/10000 [07:31<05:09, 14.13it/s]

Epoch 5620: Loss = 0.6777
Epoch 5620: Loss = 0.6215
Epoch 5620: Loss = 0.6193
Epoch 5620: Loss = 0.6986
Epoch 5620: Loss = 0.6727


 56%|█████▋    | 5632/10000 [07:31<05:25, 13.42it/s]

Epoch 5630: Loss = 0.7008
Epoch 5630: Loss = 0.6216
Epoch 5630: Loss = 0.6639
Epoch 5630: Loss = 0.6558
Epoch 5630: Loss = 0.6733


 56%|█████▋    | 5642/10000 [07:32<05:13, 13.92it/s]

Epoch 5640: Loss = 0.6628
Epoch 5640: Loss = 0.6791
Epoch 5640: Loss = 0.6707
Epoch 5640: Loss = 0.6807
Epoch 5640: Loss = 0.6597


 57%|█████▋    | 5652/10000 [07:33<05:33, 13.03it/s]

Epoch 5650: Loss = 0.6565
Epoch 5650: Loss = 0.6585
Epoch 5650: Loss = 0.6529
Epoch 5650: Loss = 0.6417
Epoch 5650: Loss = 0.6671


 57%|█████▋    | 5662/10000 [07:34<05:16, 13.69it/s]

Epoch 5660: Loss = 0.6409
Epoch 5660: Loss = 0.6725
Epoch 5660: Loss = 0.6246
Epoch 5660: Loss = 0.6575
Epoch 5660: Loss = 0.6954


 57%|█████▋    | 5672/10000 [07:34<05:39, 12.73it/s]

Epoch 5670: Loss = 0.6740
Epoch 5670: Loss = 0.6654
Epoch 5670: Loss = 0.6359
Epoch 5670: Loss = 0.6740
Epoch 5670: Loss = 0.6840


 57%|█████▋    | 5682/10000 [07:35<05:14, 13.74it/s]

Epoch 5680: Loss = 0.6339
Epoch 5680: Loss = 0.6611
Epoch 5680: Loss = 0.6327
Epoch 5680: Loss = 0.6522
Epoch 5680: Loss = 0.6530


 57%|█████▋    | 5692/10000 [07:36<06:21, 11.29it/s]

Epoch 5690: Loss = 0.6385
Epoch 5690: Loss = 0.6530
Epoch 5690: Loss = 0.6904
Epoch 5690: Loss = 0.6952
Epoch 5690: Loss = 0.6840


 57%|█████▋    | 5702/10000 [07:37<05:20, 13.41it/s]

Epoch 5700: Loss = 0.6909
Epoch 5700: Loss = 0.7014
Epoch 5700: Loss = 0.6389
Epoch 5700: Loss = 0.6502
Epoch 5700: Loss = 0.6714


 57%|█████▋    | 5712/10000 [07:38<05:49, 12.26it/s]

Epoch 5710: Loss = 0.6902
Epoch 5710: Loss = 0.6873
Epoch 5710: Loss = 0.6525
Epoch 5710: Loss = 0.6677
Epoch 5710: Loss = 0.6702


 57%|█████▋    | 5722/10000 [07:38<05:05, 13.98it/s]

Epoch 5720: Loss = 0.6557
Epoch 5720: Loss = 0.6764
Epoch 5720: Loss = 0.6586
Epoch 5720: Loss = 0.6821
Epoch 5720: Loss = 0.6512


 57%|█████▋    | 5732/10000 [07:39<05:06, 13.91it/s]

Epoch 5730: Loss = 0.6513
Epoch 5730: Loss = 0.6781
Epoch 5730: Loss = 0.6689
Epoch 5730: Loss = 0.6507
Epoch 5730: Loss = 0.6628


 57%|█████▋    | 5742/10000 [07:40<05:05, 13.93it/s]

Epoch 5740: Loss = 0.6528
Epoch 5740: Loss = 0.6535
Epoch 5740: Loss = 0.6689
Epoch 5740: Loss = 0.6668
Epoch 5740: Loss = 0.7030


 58%|█████▊    | 5752/10000 [07:41<05:28, 12.95it/s]

Epoch 5750: Loss = 0.6318
Epoch 5750: Loss = 0.6872
Epoch 5750: Loss = 0.6726
Epoch 5750: Loss = 0.6968
Epoch 5750: Loss = 0.6606


 58%|█████▊    | 5762/10000 [07:41<06:13, 11.34it/s]

Epoch 5760: Loss = 0.6429
Epoch 5760: Loss = 0.6621
Epoch 5760: Loss = 0.6542
Epoch 5760: Loss = 0.6952
Epoch 5760: Loss = 0.6777


 58%|█████▊    | 5772/10000 [07:42<05:14, 13.42it/s]

Epoch 5770: Loss = 0.6416
Epoch 5770: Loss = 0.6578
Epoch 5770: Loss = 0.6591
Epoch 5770: Loss = 0.6921
Epoch 5770: Loss = 0.6481


 58%|█████▊    | 5782/10000 [07:43<05:11, 13.55it/s]

Epoch 5780: Loss = 0.6861
Epoch 5780: Loss = 0.6851
Epoch 5780: Loss = 0.6719
Epoch 5780: Loss = 0.6671
Epoch 5780: Loss = 0.6736


 58%|█████▊    | 5792/10000 [07:44<05:56, 11.80it/s]

Epoch 5790: Loss = 0.6470
Epoch 5790: Loss = 0.6394
Epoch 5790: Loss = 0.6401
Epoch 5790: Loss = 0.6548
Epoch 5790: Loss = 0.6945


 58%|█████▊    | 5802/10000 [07:44<05:30, 12.69it/s]

Epoch 5800: Loss = 0.6727
Epoch 5800: Loss = 0.6782
Epoch 5800: Loss = 0.6526
Epoch 5800: Loss = 0.6625
Epoch 5800: Loss = 0.6318


 58%|█████▊    | 5812/10000 [07:45<05:24, 12.91it/s]

Epoch 5810: Loss = 0.6566
Epoch 5810: Loss = 0.6545
Epoch 5810: Loss = 0.6762
Epoch 5810: Loss = 0.6692
Epoch 5810: Loss = 0.6645


 58%|█████▊    | 5822/10000 [07:46<05:15, 13.24it/s]

Epoch 5820: Loss = 0.6951
Epoch 5820: Loss = 0.6980
Epoch 5820: Loss = 0.6828
Epoch 5820: Loss = 0.6950
Epoch 5820: Loss = 0.6706


 58%|█████▊    | 5832/10000 [07:47<05:29, 12.66it/s]

Epoch 5830: Loss = 0.6369
Epoch 5830: Loss = 0.6780
Epoch 5830: Loss = 0.6462
Epoch 5830: Loss = 0.6765
Epoch 5830: Loss = 0.6644


 58%|█████▊    | 5842/10000 [07:48<05:18, 13.07it/s]

Epoch 5840: Loss = 0.6542
Epoch 5840: Loss = 0.6610
Epoch 5840: Loss = 0.6718
Epoch 5840: Loss = 0.6437
Epoch 5840: Loss = 0.6662


 59%|█████▊    | 5852/10000 [07:48<05:00, 13.79it/s]

Epoch 5850: Loss = 0.6470
Epoch 5850: Loss = 0.6757
Epoch 5850: Loss = 0.6542
Epoch 5850: Loss = 0.6619
Epoch 5850: Loss = 0.6606


 59%|█████▊    | 5862/10000 [07:49<04:54, 14.03it/s]

Epoch 5860: Loss = 0.6339
Epoch 5860: Loss = 0.6581
Epoch 5860: Loss = 0.6554
Epoch 5860: Loss = 0.7026
Epoch 5860: Loss = 0.6619


 59%|█████▊    | 5872/10000 [07:50<05:17, 12.98it/s]

Epoch 5870: Loss = 0.6313
Epoch 5870: Loss = 0.6710
Epoch 5870: Loss = 0.7069
Epoch 5870: Loss = 0.6851
Epoch 5870: Loss = 0.6618


 59%|█████▉    | 5882/10000 [07:51<05:25, 12.63it/s]

Epoch 5880: Loss = 0.6360
Epoch 5880: Loss = 0.6797
Epoch 5880: Loss = 0.6690
Epoch 5880: Loss = 0.6820
Epoch 5880: Loss = 0.6504


 59%|█████▉    | 5892/10000 [07:51<05:06, 13.39it/s]

Epoch 5890: Loss = 0.6887
Epoch 5890: Loss = 0.6249
Epoch 5890: Loss = 0.6500
Epoch 5890: Loss = 0.6274
Epoch 5890: Loss = 0.6813


 59%|█████▉    | 5902/10000 [07:52<06:09, 11.10it/s]

Epoch 5900: Loss = 0.6795
Epoch 5900: Loss = 0.6671
Epoch 5900: Loss = 0.6718
Epoch 5900: Loss = 0.6890
Epoch 5900: Loss = 0.6264


 59%|█████▉    | 5912/10000 [07:53<05:39, 12.06it/s]

Epoch 5910: Loss = 0.6558
Epoch 5910: Loss = 0.6867
Epoch 5910: Loss = 0.6495
Epoch 5910: Loss = 0.6713
Epoch 5910: Loss = 0.6688


 59%|█████▉    | 5922/10000 [07:54<05:53, 11.55it/s]

Epoch 5920: Loss = 0.6834
Epoch 5920: Loss = 0.6685
Epoch 5920: Loss = 0.6641
Epoch 5920: Loss = 0.6596
Epoch 5920: Loss = 0.6997


 59%|█████▉    | 5932/10000 [07:55<05:01, 13.51it/s]

Epoch 5930: Loss = 0.6449
Epoch 5930: Loss = 0.6247
Epoch 5930: Loss = 0.7011
Epoch 5930: Loss = 0.6738
Epoch 5930: Loss = 0.6737


 59%|█████▉    | 5942/10000 [07:56<04:51, 13.91it/s]

Epoch 5940: Loss = 0.6604
Epoch 5940: Loss = 0.6576
Epoch 5940: Loss = 0.6709
Epoch 5940: Loss = 0.6628
Epoch 5940: Loss = 0.6392


 60%|█████▉    | 5952/10000 [07:56<06:10, 10.92it/s]

Epoch 5950: Loss = 0.6645
Epoch 5950: Loss = 0.6712
Epoch 5950: Loss = 0.6718
Epoch 5950: Loss = 0.6372
Epoch 5950: Loss = 0.6732


 60%|█████▉    | 5962/10000 [07:57<05:51, 11.48it/s]

Epoch 5960: Loss = 0.6607
Epoch 5960: Loss = 0.6935
Epoch 5960: Loss = 0.6583
Epoch 5960: Loss = 0.6687
Epoch 5960: Loss = 0.6889


 60%|█████▉    | 5972/10000 [07:58<06:16, 10.69it/s]

Epoch 5970: Loss = 0.6776
Epoch 5970: Loss = 0.6757
Epoch 5970: Loss = 0.6660
Epoch 5970: Loss = 0.6645
Epoch 5970: Loss = 0.6514


 60%|█████▉    | 5982/10000 [07:59<05:31, 12.11it/s]

Epoch 5980: Loss = 0.6636
Epoch 5980: Loss = 0.6345
Epoch 5980: Loss = 0.6595
Epoch 5980: Loss = 0.6756
Epoch 5980: Loss = 0.6411


 60%|█████▉    | 5992/10000 [08:00<06:15, 10.67it/s]

Epoch 5990: Loss = 0.6585
Epoch 5990: Loss = 0.6600
Epoch 5990: Loss = 0.6728
Epoch 5990: Loss = 0.6537
Epoch 5990: Loss = 0.6719


 60%|██████    | 6002/10000 [08:01<05:33, 11.98it/s]

Epoch 6000: Loss = 0.6740
Epoch 6000: Loss = 0.6737
Epoch 6000: Loss = 0.6656
Epoch 6000: Loss = 0.6644
Epoch 6000: Loss = 0.6925


 60%|██████    | 6012/10000 [08:02<04:57, 13.41it/s]

Epoch 6010: Loss = 0.6501
Epoch 6010: Loss = 0.6574
Epoch 6010: Loss = 0.6613
Epoch 6010: Loss = 0.6837
Epoch 6010: Loss = 0.6792


 60%|██████    | 6022/10000 [08:02<05:32, 11.98it/s]

Epoch 6020: Loss = 0.6916
Epoch 6020: Loss = 0.6566
Epoch 6020: Loss = 0.6687
Epoch 6020: Loss = 0.6400
Epoch 6020: Loss = 0.6687


 60%|██████    | 6032/10000 [08:03<05:58, 11.08it/s]

Epoch 6030: Loss = 0.6419
Epoch 6030: Loss = 0.7095
Epoch 6030: Loss = 0.7367
Epoch 6030: Loss = 0.6667
Epoch 6030: Loss = 0.6609


 60%|██████    | 6042/10000 [08:04<05:08, 12.81it/s]

Epoch 6040: Loss = 0.6527
Epoch 6040: Loss = 0.6583
Epoch 6040: Loss = 0.6372
Epoch 6040: Loss = 0.6741
Epoch 6040: Loss = 0.7026


 61%|██████    | 6052/10000 [08:05<05:17, 12.43it/s]

Epoch 6050: Loss = 0.7069
Epoch 6050: Loss = 0.6526
Epoch 6050: Loss = 0.6907
Epoch 6050: Loss = 0.6662
Epoch 6050: Loss = 0.6507


 61%|██████    | 6062/10000 [08:06<05:00, 13.09it/s]

Epoch 6060: Loss = 0.6539
Epoch 6060: Loss = 0.6826
Epoch 6060: Loss = 0.6798
Epoch 6060: Loss = 0.7069
Epoch 6060: Loss = 0.6823


 61%|██████    | 6072/10000 [08:07<05:32, 11.82it/s]

Epoch 6070: Loss = 0.6241
Epoch 6070: Loss = 0.6621
Epoch 6070: Loss = 0.6745
Epoch 6070: Loss = 0.6767
Epoch 6070: Loss = 0.7026


 61%|██████    | 6082/10000 [08:07<04:46, 13.67it/s]

Epoch 6080: Loss = 0.6762
Epoch 6080: Loss = 0.6499
Epoch 6080: Loss = 0.6757
Epoch 6080: Loss = 0.6742
Epoch 6080: Loss = 0.6972


 61%|██████    | 6092/10000 [08:08<04:58, 13.10it/s]

Epoch 6090: Loss = 0.6524
Epoch 6090: Loss = 0.7096
Epoch 6090: Loss = 0.6792
Epoch 6090: Loss = 0.6499
Epoch 6090: Loss = 0.6496


 61%|██████    | 6102/10000 [08:09<05:29, 11.83it/s]

Epoch 6100: Loss = 0.6635
Epoch 6100: Loss = 0.6712
Epoch 6100: Loss = 0.6918
Epoch 6100: Loss = 0.6868
Epoch 6100: Loss = 0.6650


 61%|██████    | 6112/10000 [08:10<05:52, 11.02it/s]

Epoch 6110: Loss = 0.6783
Epoch 6110: Loss = 0.6801
Epoch 6110: Loss = 0.6682
Epoch 6110: Loss = 0.6833
Epoch 6110: Loss = 0.6720


 61%|██████    | 6122/10000 [08:11<05:16, 12.24it/s]

Epoch 6120: Loss = 0.6667
Epoch 6120: Loss = 0.6624
Epoch 6120: Loss = 0.6502
Epoch 6120: Loss = 0.6463
Epoch 6120: Loss = 0.6783


 61%|██████▏   | 6132/10000 [08:12<06:01, 10.71it/s]

Epoch 6130: Loss = 0.6597
Epoch 6130: Loss = 0.6889
Epoch 6130: Loss = 0.6574
Epoch 6130: Loss = 0.6859
Epoch 6130: Loss = 0.6347


 61%|██████▏   | 6142/10000 [08:13<05:38, 11.38it/s]

Epoch 6140: Loss = 0.6726
Epoch 6140: Loss = 0.6766
Epoch 6140: Loss = 0.7227
Epoch 6140: Loss = 0.6552
Epoch 6140: Loss = 0.6759


 62%|██████▏   | 6152/10000 [08:13<05:39, 11.34it/s]

Epoch 6150: Loss = 0.6509
Epoch 6150: Loss = 0.6715
Epoch 6150: Loss = 0.6496
Epoch 6150: Loss = 0.7005
Epoch 6150: Loss = 0.6403


 62%|██████▏   | 6162/10000 [08:14<05:24, 11.84it/s]

Epoch 6160: Loss = 0.6504
Epoch 6160: Loss = 0.6399
Epoch 6160: Loss = 0.7008
Epoch 6160: Loss = 0.6850
Epoch 6160: Loss = 0.6898


 62%|██████▏   | 6172/10000 [08:15<05:42, 11.17it/s]

Epoch 6170: Loss = 0.6424
Epoch 6170: Loss = 0.6477
Epoch 6170: Loss = 0.6619
Epoch 6170: Loss = 0.6754
Epoch 6170: Loss = 0.6538


 62%|██████▏   | 6182/10000 [08:16<04:47, 13.27it/s]

Epoch 6180: Loss = 0.6602
Epoch 6180: Loss = 0.6280
Epoch 6180: Loss = 0.6677
Epoch 6180: Loss = 0.6738
Epoch 6180: Loss = 0.6673


 62%|██████▏   | 6192/10000 [08:17<05:09, 12.32it/s]

Epoch 6190: Loss = 0.6545
Epoch 6190: Loss = 0.6936
Epoch 6190: Loss = 0.6455
Epoch 6190: Loss = 0.6384
Epoch 6190: Loss = 0.6762


 62%|██████▏   | 6202/10000 [08:17<05:11, 12.21it/s]

Epoch 6200: Loss = 0.6785
Epoch 6200: Loss = 0.6855
Epoch 6200: Loss = 0.7138
Epoch 6200: Loss = 0.6838
Epoch 6200: Loss = 0.6878


 62%|██████▏   | 6212/10000 [08:18<05:06, 12.34it/s]

Epoch 6210: Loss = 0.6544
Epoch 6210: Loss = 0.6733
Epoch 6210: Loss = 0.6508
Epoch 6210: Loss = 0.6801
Epoch 6210: Loss = 0.6903


 62%|██████▏   | 6222/10000 [08:19<04:52, 12.91it/s]

Epoch 6220: Loss = 0.6647
Epoch 6220: Loss = 0.7236
Epoch 6220: Loss = 0.6586
Epoch 6220: Loss = 0.6497
Epoch 6220: Loss = 0.6966


 62%|██████▏   | 6232/10000 [08:20<04:44, 13.24it/s]

Epoch 6230: Loss = 0.6563
Epoch 6230: Loss = 0.6570
Epoch 6230: Loss = 0.6564
Epoch 6230: Loss = 0.6916
Epoch 6230: Loss = 0.7154


 62%|██████▏   | 6242/10000 [08:21<04:31, 13.85it/s]

Epoch 6240: Loss = 0.6547
Epoch 6240: Loss = 0.6267
Epoch 6240: Loss = 0.6261
Epoch 6240: Loss = 0.6754
Epoch 6240: Loss = 0.6741


 63%|██████▎   | 6252/10000 [08:21<05:21, 11.64it/s]

Epoch 6250: Loss = 0.6822
Epoch 6250: Loss = 0.6768
Epoch 6250: Loss = 0.6989
Epoch 6250: Loss = 0.6449
Epoch 6250: Loss = 0.6376


 63%|██████▎   | 6262/10000 [08:22<04:56, 12.59it/s]

Epoch 6260: Loss = 0.6271
Epoch 6260: Loss = 0.6560
Epoch 6260: Loss = 0.6637
Epoch 6260: Loss = 0.6670
Epoch 6260: Loss = 0.6641


 63%|██████▎   | 6272/10000 [08:23<05:06, 12.15it/s]

Epoch 6270: Loss = 0.6617
Epoch 6270: Loss = 0.6573
Epoch 6270: Loss = 0.6870
Epoch 6270: Loss = 0.6633
Epoch 6270: Loss = 0.6331


 63%|██████▎   | 6282/10000 [08:24<04:41, 13.20it/s]

Epoch 6280: Loss = 0.6678
Epoch 6280: Loss = 0.7011
Epoch 6280: Loss = 0.6645
Epoch 6280: Loss = 0.6746
Epoch 6280: Loss = 0.6490


 63%|██████▎   | 6292/10000 [08:25<04:26, 13.92it/s]

Epoch 6290: Loss = 0.6786
Epoch 6290: Loss = 0.6685
Epoch 6290: Loss = 0.6763
Epoch 6290: Loss = 0.6845
Epoch 6290: Loss = 0.6627


 63%|██████▎   | 6302/10000 [08:25<04:20, 14.18it/s]

Epoch 6300: Loss = 0.6750
Epoch 6300: Loss = 0.6771
Epoch 6300: Loss = 0.6835
Epoch 6300: Loss = 0.6810
Epoch 6300: Loss = 0.6881


 63%|██████▎   | 6312/10000 [08:26<05:01, 12.21it/s]

Epoch 6310: Loss = 0.6752
Epoch 6310: Loss = 0.6811
Epoch 6310: Loss = 0.6882
Epoch 6310: Loss = 0.7135
Epoch 6310: Loss = 0.6613


 63%|██████▎   | 6322/10000 [08:27<04:27, 13.75it/s]

Epoch 6320: Loss = 0.6824
Epoch 6320: Loss = 0.6647
Epoch 6320: Loss = 0.6471
Epoch 6320: Loss = 0.6724
Epoch 6320: Loss = 0.6736


 63%|██████▎   | 6332/10000 [08:28<05:09, 11.86it/s]

Epoch 6330: Loss = 0.6558
Epoch 6330: Loss = 0.6736
Epoch 6330: Loss = 0.6712
Epoch 6330: Loss = 0.6691
Epoch 6330: Loss = 0.6661


 63%|██████▎   | 6342/10000 [08:28<04:24, 13.80it/s]

Epoch 6340: Loss = 0.6578
Epoch 6340: Loss = 0.6723
Epoch 6340: Loss = 0.7031
Epoch 6340: Loss = 0.6609
Epoch 6340: Loss = 0.6728


 64%|██████▎   | 6352/10000 [08:29<04:51, 12.52it/s]

Epoch 6350: Loss = 0.6481
Epoch 6350: Loss = 0.6557
Epoch 6350: Loss = 0.6702
Epoch 6350: Loss = 0.6817
Epoch 6350: Loss = 0.6766


 64%|██████▎   | 6362/10000 [08:30<04:49, 12.57it/s]

Epoch 6360: Loss = 0.6634
Epoch 6360: Loss = 0.6623
Epoch 6360: Loss = 0.6859
Epoch 6360: Loss = 0.6846
Epoch 6360: Loss = 0.6448


 64%|██████▎   | 6372/10000 [08:31<04:55, 12.27it/s]

Epoch 6370: Loss = 0.6491
Epoch 6370: Loss = 0.6807
Epoch 6370: Loss = 0.6562
Epoch 6370: Loss = 0.6633
Epoch 6370: Loss = 0.7156


 64%|██████▍   | 6382/10000 [08:32<05:06, 11.80it/s]

Epoch 6380: Loss = 0.6682
Epoch 6380: Loss = 0.6939
Epoch 6380: Loss = 0.6742
Epoch 6380: Loss = 0.6828
Epoch 6380: Loss = 0.6410


 64%|██████▍   | 6392/10000 [08:33<05:01, 11.96it/s]

Epoch 6390: Loss = 0.7127
Epoch 6390: Loss = 0.6752
Epoch 6390: Loss = 0.6889
Epoch 6390: Loss = 0.6862
Epoch 6390: Loss = 0.6608


 64%|██████▍   | 6402/10000 [08:33<05:08, 11.65it/s]

Epoch 6400: Loss = 0.6596
Epoch 6400: Loss = 0.6990
Epoch 6400: Loss = 0.6865
Epoch 6400: Loss = 0.6614
Epoch 6400: Loss = 0.6918


 64%|██████▍   | 6412/10000 [08:34<05:13, 11.46it/s]

Epoch 6410: Loss = 0.6679
Epoch 6410: Loss = 0.6747
Epoch 6410: Loss = 0.6727
Epoch 6410: Loss = 0.6815
Epoch 6410: Loss = 0.6838


 64%|██████▍   | 6422/10000 [08:35<05:07, 11.65it/s]

Epoch 6420: Loss = 0.6743
Epoch 6420: Loss = 0.6601
Epoch 6420: Loss = 0.6581
Epoch 6420: Loss = 0.6683
Epoch 6420: Loss = 0.6834


 64%|██████▍   | 6432/10000 [08:36<04:33, 13.04it/s]

Epoch 6430: Loss = 0.6350
Epoch 6430: Loss = 0.6487
Epoch 6430: Loss = 0.6950
Epoch 6430: Loss = 0.6701
Epoch 6430: Loss = 0.6691


 64%|██████▍   | 6442/10000 [08:37<04:14, 13.99it/s]

Epoch 6440: Loss = 0.6712
Epoch 6440: Loss = 0.6642
Epoch 6440: Loss = 0.6881
Epoch 6440: Loss = 0.6580
Epoch 6440: Loss = 0.6745


 65%|██████▍   | 6452/10000 [08:37<04:42, 12.55it/s]

Epoch 6450: Loss = 0.6792
Epoch 6450: Loss = 0.6774
Epoch 6450: Loss = 0.6414
Epoch 6450: Loss = 0.6620
Epoch 6450: Loss = 0.6702


 65%|██████▍   | 6462/10000 [08:38<04:24, 13.38it/s]

Epoch 6460: Loss = 0.6506
Epoch 6460: Loss = 0.6569
Epoch 6460: Loss = 0.6678
Epoch 6460: Loss = 0.6630
Epoch 6460: Loss = 0.6341


 65%|██████▍   | 6472/10000 [08:39<04:24, 13.33it/s]

Epoch 6470: Loss = 0.6523
Epoch 6470: Loss = 0.6574
Epoch 6470: Loss = 0.6517
Epoch 6470: Loss = 0.6393
Epoch 6470: Loss = 0.6637


 65%|██████▍   | 6482/10000 [08:40<04:11, 13.99it/s]

Epoch 6480: Loss = 0.6636
Epoch 6480: Loss = 0.6935
Epoch 6480: Loss = 0.7056
Epoch 6480: Loss = 0.6671
Epoch 6480: Loss = 0.6646


 65%|██████▍   | 6492/10000 [08:40<04:26, 13.18it/s]

Epoch 6490: Loss = 0.6865
Epoch 6490: Loss = 0.6897
Epoch 6490: Loss = 0.6591
Epoch 6490: Loss = 0.6535
Epoch 6490: Loss = 0.6632


 65%|██████▌   | 6502/10000 [08:41<04:38, 12.55it/s]

Epoch 6500: Loss = 0.6591
Epoch 6500: Loss = 0.6704
Epoch 6500: Loss = 0.6399
Epoch 6500: Loss = 0.6535
Epoch 6500: Loss = 0.6854


 65%|██████▌   | 6510/10000 [08:42<04:38, 12.52it/s]

Epoch 6510: Loss = 0.6696
Epoch 6510: Loss = 0.6825
Epoch 6510: Loss = 0.6827
Epoch 6510: Loss = 0.6564
Epoch 6510: Loss = 0.6712


 65%|██████▌   | 6522/10000 [08:43<04:36, 12.57it/s]

Epoch 6520: Loss = 0.6659
Epoch 6520: Loss = 0.6960
Epoch 6520: Loss = 0.6774
Epoch 6520: Loss = 0.6933
Epoch 6520: Loss = 0.6434


 65%|██████▌   | 6532/10000 [08:44<04:23, 13.16it/s]

Epoch 6530: Loss = 0.6465
Epoch 6530: Loss = 0.6417
Epoch 6530: Loss = 0.6621
Epoch 6530: Loss = 0.6646
Epoch 6530: Loss = 0.6650


 65%|██████▌   | 6542/10000 [08:44<04:21, 13.25it/s]

Epoch 6540: Loss = 0.6645
Epoch 6540: Loss = 0.6605
Epoch 6540: Loss = 0.6520
Epoch 6540: Loss = 0.6867
Epoch 6540: Loss = 0.6388


 66%|██████▌   | 6552/10000 [08:45<04:20, 13.23it/s]

Epoch 6550: Loss = 0.6448
Epoch 6550: Loss = 0.6311
Epoch 6550: Loss = 0.6577
Epoch 6550: Loss = 0.6625
Epoch 6550: Loss = 0.6840


 66%|██████▌   | 6562/10000 [08:46<04:26, 12.90it/s]

Epoch 6560: Loss = 0.6616
Epoch 6560: Loss = 0.6880
Epoch 6560: Loss = 0.6441
Epoch 6560: Loss = 0.6485
Epoch 6560: Loss = 0.6820


 66%|██████▌   | 6572/10000 [08:47<04:27, 12.82it/s]

Epoch 6570: Loss = 0.6819
Epoch 6570: Loss = 0.6506
Epoch 6570: Loss = 0.6627
Epoch 6570: Loss = 0.6770
Epoch 6570: Loss = 0.6562


 66%|██████▌   | 6580/10000 [08:47<04:07, 13.80it/s]

Epoch 6580: Loss = 0.6968
Epoch 6580: Loss = 0.6436
Epoch 6580: Loss = 0.6588
Epoch 6580: Loss = 0.6521
Epoch 6580: Loss = 0.6445


 66%|██████▌   | 6592/10000 [08:48<04:44, 11.96it/s]

Epoch 6590: Loss = 0.6663
Epoch 6590: Loss = 0.6665
Epoch 6590: Loss = 0.7086
Epoch 6590: Loss = 0.6635
Epoch 6590: Loss = 0.6839


 66%|██████▌   | 6602/10000 [08:49<04:14, 13.33it/s]

Epoch 6600: Loss = 0.6768
Epoch 6600: Loss = 0.6648
Epoch 6600: Loss = 0.6943
Epoch 6600: Loss = 0.6581
Epoch 6600: Loss = 0.6842


 66%|██████▌   | 6612/10000 [08:50<04:04, 13.88it/s]

Epoch 6610: Loss = 0.6523
Epoch 6610: Loss = 0.6684
Epoch 6610: Loss = 0.6851
Epoch 6610: Loss = 0.6621
Epoch 6610: Loss = 0.6670


 66%|██████▌   | 6622/10000 [08:51<04:04, 13.80it/s]

Epoch 6620: Loss = 0.7243
Epoch 6620: Loss = 0.6822
Epoch 6620: Loss = 0.6742
Epoch 6620: Loss = 0.6753
Epoch 6620: Loss = 0.6989


 66%|██████▋   | 6632/10000 [08:51<04:12, 13.34it/s]

Epoch 6630: Loss = 0.6802
Epoch 6630: Loss = 0.7126
Epoch 6630: Loss = 0.6558
Epoch 6630: Loss = 0.6408
Epoch 6630: Loss = 0.6762


 66%|██████▋   | 6642/10000 [08:52<04:04, 13.73it/s]

Epoch 6640: Loss = 0.6550
Epoch 6640: Loss = 0.6598
Epoch 6640: Loss = 0.6690
Epoch 6640: Loss = 0.6312
Epoch 6640: Loss = 0.6683


 67%|██████▋   | 6652/10000 [08:53<04:00, 13.93it/s]

Epoch 6650: Loss = 0.6630
Epoch 6650: Loss = 0.6875
Epoch 6650: Loss = 0.6663
Epoch 6650: Loss = 0.6390
Epoch 6650: Loss = 0.6437


 67%|██████▋   | 6662/10000 [08:54<04:05, 13.58it/s]

Epoch 6660: Loss = 0.6465
Epoch 6660: Loss = 0.6810
Epoch 6660: Loss = 0.6744
Epoch 6660: Loss = 0.6648
Epoch 6660: Loss = 0.6539


 67%|██████▋   | 6672/10000 [08:54<04:14, 13.06it/s]

Epoch 6670: Loss = 0.6626
Epoch 6670: Loss = 0.6630
Epoch 6670: Loss = 0.6468
Epoch 6670: Loss = 0.6678
Epoch 6670: Loss = 0.6831


 67%|██████▋   | 6682/10000 [08:55<03:58, 13.90it/s]

Epoch 6680: Loss = 0.6895
Epoch 6680: Loss = 0.6812
Epoch 6680: Loss = 0.6734
Epoch 6680: Loss = 0.6766
Epoch 6680: Loss = 0.7011


 67%|██████▋   | 6692/10000 [08:56<03:52, 14.24it/s]

Epoch 6690: Loss = 0.6340
Epoch 6690: Loss = 0.6548
Epoch 6690: Loss = 0.6822
Epoch 6690: Loss = 0.6677
Epoch 6690: Loss = 0.6558


 67%|██████▋   | 6702/10000 [08:57<03:58, 13.83it/s]

Epoch 6700: Loss = 0.6595
Epoch 6700: Loss = 0.6836
Epoch 6700: Loss = 0.6689
Epoch 6700: Loss = 0.6544
Epoch 6700: Loss = 0.6393


 67%|██████▋   | 6712/10000 [08:57<04:08, 13.25it/s]

Epoch 6710: Loss = 0.6952
Epoch 6710: Loss = 0.6614
Epoch 6710: Loss = 0.6733
Epoch 6710: Loss = 0.6198
Epoch 6710: Loss = 0.6470


 67%|██████▋   | 6722/10000 [08:58<04:20, 12.56it/s]

Epoch 6720: Loss = 0.6702
Epoch 6720: Loss = 0.6284
Epoch 6720: Loss = 0.6603
Epoch 6720: Loss = 0.6800
Epoch 6720: Loss = 0.6851


 67%|██████▋   | 6732/10000 [08:59<04:08, 13.13it/s]

Epoch 6730: Loss = 0.6882
Epoch 6730: Loss = 0.6842
Epoch 6730: Loss = 0.6765
Epoch 6730: Loss = 0.6841
Epoch 6730: Loss = 0.7056


 67%|██████▋   | 6742/10000 [09:00<04:11, 12.93it/s]

Epoch 6740: Loss = 0.6557
Epoch 6740: Loss = 0.6480
Epoch 6740: Loss = 0.6535
Epoch 6740: Loss = 0.7050
Epoch 6740: Loss = 0.6836


 68%|██████▊   | 6752/10000 [09:00<03:58, 13.63it/s]

Epoch 6750: Loss = 0.6546
Epoch 6750: Loss = 0.6532
Epoch 6750: Loss = 0.7243
Epoch 6750: Loss = 0.6787
Epoch 6750: Loss = 0.6749


 68%|██████▊   | 6762/10000 [09:01<03:58, 13.56it/s]

Epoch 6760: Loss = 0.6567
Epoch 6760: Loss = 0.6867
Epoch 6760: Loss = 0.6659
Epoch 6760: Loss = 0.6545
Epoch 6760: Loss = 0.6432


 68%|██████▊   | 6772/10000 [09:02<04:11, 12.82it/s]

Epoch 6770: Loss = 0.6690
Epoch 6770: Loss = 0.6463
Epoch 6770: Loss = 0.6438
Epoch 6770: Loss = 0.6778
Epoch 6770: Loss = 0.6802


 68%|██████▊   | 6782/10000 [09:03<03:58, 13.49it/s]

Epoch 6780: Loss = 0.6589
Epoch 6780: Loss = 0.6523
Epoch 6780: Loss = 0.6446
Epoch 6780: Loss = 0.6616
Epoch 6780: Loss = 0.6786


 68%|██████▊   | 6792/10000 [09:04<04:37, 11.58it/s]

Epoch 6790: Loss = 0.6486
Epoch 6790: Loss = 0.6590
Epoch 6790: Loss = 0.6829
Epoch 6790: Loss = 0.6997
Epoch 6790: Loss = 0.6401


 68%|██████▊   | 6802/10000 [09:04<04:18, 12.39it/s]

Epoch 6800: Loss = 0.6625
Epoch 6800: Loss = 0.7164
Epoch 6800: Loss = 0.6696
Epoch 6800: Loss = 0.6880
Epoch 6800: Loss = 0.6437


 68%|██████▊   | 6812/10000 [09:05<04:17, 12.40it/s]

Epoch 6810: Loss = 0.6686
Epoch 6810: Loss = 0.6606
Epoch 6810: Loss = 0.6975
Epoch 6810: Loss = 0.6421
Epoch 6810: Loss = 0.6852


 68%|██████▊   | 6822/10000 [09:06<04:10, 12.67it/s]

Epoch 6820: Loss = 0.6564
Epoch 6820: Loss = 0.6955
Epoch 6820: Loss = 0.6918
Epoch 6820: Loss = 0.6810
Epoch 6820: Loss = 0.6599


 68%|██████▊   | 6832/10000 [09:07<04:22, 12.05it/s]

Epoch 6830: Loss = 0.6681
Epoch 6830: Loss = 0.6576
Epoch 6830: Loss = 0.6573
Epoch 6830: Loss = 0.6497
Epoch 6830: Loss = 0.6538


 68%|██████▊   | 6842/10000 [09:08<03:52, 13.56it/s]

Epoch 6840: Loss = 0.6789
Epoch 6840: Loss = 0.6531
Epoch 6840: Loss = 0.6705
Epoch 6840: Loss = 0.6716
Epoch 6840: Loss = 0.6737


 69%|██████▊   | 6852/10000 [09:08<03:59, 13.13it/s]

Epoch 6850: Loss = 0.6532
Epoch 6850: Loss = 0.6629
Epoch 6850: Loss = 0.6751
Epoch 6850: Loss = 0.6756
Epoch 6850: Loss = 0.6748


 69%|██████▊   | 6862/10000 [09:09<04:02, 12.93it/s]

Epoch 6860: Loss = 0.7137
Epoch 6860: Loss = 0.6886
Epoch 6860: Loss = 0.6491
Epoch 6860: Loss = 0.6616
Epoch 6860: Loss = 0.6622


 69%|██████▊   | 6872/10000 [09:10<04:13, 12.36it/s]

Epoch 6870: Loss = 0.6759
Epoch 6870: Loss = 0.6434
Epoch 6870: Loss = 0.6607
Epoch 6870: Loss = 0.6858
Epoch 6870: Loss = 0.6451


 69%|██████▉   | 6882/10000 [09:11<03:44, 13.88it/s]

Epoch 6880: Loss = 0.6920
Epoch 6880: Loss = 0.6685
Epoch 6880: Loss = 0.6333
Epoch 6880: Loss = 0.6539
Epoch 6880: Loss = 0.6611


 69%|██████▉   | 6892/10000 [09:11<03:57, 13.08it/s]

Epoch 6890: Loss = 0.6576
Epoch 6890: Loss = 0.6711
Epoch 6890: Loss = 0.6177
Epoch 6890: Loss = 0.6542
Epoch 6890: Loss = 0.6644


 69%|██████▉   | 6902/10000 [09:12<04:25, 11.66it/s]

Epoch 6900: Loss = 0.6524
Epoch 6900: Loss = 0.6651
Epoch 6900: Loss = 0.6558
Epoch 6900: Loss = 0.6647
Epoch 6900: Loss = 0.6762


 69%|██████▉   | 6912/10000 [09:13<03:54, 13.18it/s]

Epoch 6910: Loss = 0.6984
Epoch 6910: Loss = 0.6898
Epoch 6910: Loss = 0.6327
Epoch 6910: Loss = 0.6560
Epoch 6910: Loss = 0.6372


 69%|██████▉   | 6922/10000 [09:14<03:40, 13.98it/s]

Epoch 6920: Loss = 0.6666
Epoch 6920: Loss = 0.6303
Epoch 6920: Loss = 0.6562
Epoch 6920: Loss = 0.6772
Epoch 6920: Loss = 0.6998


 69%|██████▉   | 6932/10000 [09:15<04:26, 11.51it/s]

Epoch 6930: Loss = 0.6664
Epoch 6930: Loss = 0.6901
Epoch 6930: Loss = 0.6571
Epoch 6930: Loss = 0.6917
Epoch 6930: Loss = 0.7084


 69%|██████▉   | 6942/10000 [09:15<04:09, 12.27it/s]

Epoch 6940: Loss = 0.6663
Epoch 6940: Loss = 0.6429
Epoch 6940: Loss = 0.6718
Epoch 6940: Loss = 0.6370
Epoch 6940: Loss = 0.6977


 70%|██████▉   | 6952/10000 [09:16<04:00, 12.66it/s]

Epoch 6950: Loss = 0.6562
Epoch 6950: Loss = 0.6527
Epoch 6950: Loss = 0.6802
Epoch 6950: Loss = 0.6606
Epoch 6950: Loss = 0.6513


 70%|██████▉   | 6962/10000 [09:17<04:02, 12.51it/s]

Epoch 6960: Loss = 0.6605
Epoch 6960: Loss = 0.6853
Epoch 6960: Loss = 0.6875
Epoch 6960: Loss = 0.6727
Epoch 6960: Loss = 0.7183


 70%|██████▉   | 6972/10000 [09:18<03:40, 13.71it/s]

Epoch 6970: Loss = 0.6808
Epoch 6970: Loss = 0.6545
Epoch 6970: Loss = 0.6725
Epoch 6970: Loss = 0.6806
Epoch 6970: Loss = 0.6407


 70%|██████▉   | 6982/10000 [09:18<03:38, 13.84it/s]

Epoch 6980: Loss = 0.6387
Epoch 6980: Loss = 0.6819
Epoch 6980: Loss = 0.6654
Epoch 6980: Loss = 0.6808
Epoch 6980: Loss = 0.6553


 70%|██████▉   | 6992/10000 [09:19<03:53, 12.86it/s]

Epoch 6990: Loss = 0.6315
Epoch 6990: Loss = 0.6650
Epoch 6990: Loss = 0.6845
Epoch 6990: Loss = 0.7050
Epoch 6990: Loss = 0.6777


 70%|███████   | 7002/10000 [09:20<04:25, 11.28it/s]

Epoch 7000: Loss = 0.6282
Epoch 7000: Loss = 0.6647
Epoch 7000: Loss = 0.7183
Epoch 7000: Loss = 0.6578
Epoch 7000: Loss = 0.6871


 70%|███████   | 7012/10000 [09:21<03:41, 13.47it/s]

Epoch 7010: Loss = 0.6444
Epoch 7010: Loss = 0.6771
Epoch 7010: Loss = 0.6854
Epoch 7010: Loss = 0.6538
Epoch 7010: Loss = 0.6727


 70%|███████   | 7022/10000 [09:22<03:53, 12.73it/s]

Epoch 7020: Loss = 0.6583
Epoch 7020: Loss = 0.6947
Epoch 7020: Loss = 0.6529
Epoch 7020: Loss = 0.6940
Epoch 7020: Loss = 0.6321


 70%|███████   | 7032/10000 [09:23<03:59, 12.37it/s]

Epoch 7030: Loss = 0.6454
Epoch 7030: Loss = 0.6765
Epoch 7030: Loss = 0.6496
Epoch 7030: Loss = 0.6478
Epoch 7030: Loss = 0.6474


 70%|███████   | 7042/10000 [09:23<04:16, 11.51it/s]

Epoch 7040: Loss = 0.6800
Epoch 7040: Loss = 0.6992
Epoch 7040: Loss = 0.6826
Epoch 7040: Loss = 0.6960
Epoch 7040: Loss = 0.6466


 71%|███████   | 7052/10000 [09:24<04:04, 12.06it/s]

Epoch 7050: Loss = 0.6619
Epoch 7050: Loss = 0.6609
Epoch 7050: Loss = 0.6462
Epoch 7050: Loss = 0.6690
Epoch 7050: Loss = 0.6850


 71%|███████   | 7062/10000 [09:25<03:37, 13.51it/s]

Epoch 7060: Loss = 0.6984
Epoch 7060: Loss = 0.6841
Epoch 7060: Loss = 0.6574
Epoch 7060: Loss = 0.6951
Epoch 7060: Loss = 0.6517


 71%|███████   | 7072/10000 [09:26<03:54, 12.49it/s]

Epoch 7070: Loss = 0.6585
Epoch 7070: Loss = 0.6807
Epoch 7070: Loss = 0.6721
Epoch 7070: Loss = 0.6687
Epoch 7070: Loss = 0.6432


 71%|███████   | 7082/10000 [09:27<03:43, 13.06it/s]

Epoch 7080: Loss = 0.6553
Epoch 7080: Loss = 0.6571
Epoch 7080: Loss = 0.6644
Epoch 7080: Loss = 0.6644
Epoch 7080: Loss = 0.6810


 71%|███████   | 7092/10000 [09:27<03:36, 13.42it/s]

Epoch 7090: Loss = 0.6493
Epoch 7090: Loss = 0.6500
Epoch 7090: Loss = 0.6855
Epoch 7090: Loss = 0.6247
Epoch 7090: Loss = 0.6443


 71%|███████   | 7102/10000 [09:28<03:55, 12.33it/s]

Epoch 7100: Loss = 0.6487
Epoch 7100: Loss = 0.6657
Epoch 7100: Loss = 0.6858
Epoch 7100: Loss = 0.6769
Epoch 7100: Loss = 0.6824


 71%|███████   | 7112/10000 [09:29<03:44, 12.87it/s]

Epoch 7110: Loss = 0.6469
Epoch 7110: Loss = 0.6731
Epoch 7110: Loss = 0.6750
Epoch 7110: Loss = 0.6464
Epoch 7110: Loss = 0.6659


 71%|███████   | 7122/10000 [09:30<04:03, 11.81it/s]

Epoch 7120: Loss = 0.6525
Epoch 7120: Loss = 0.6467
Epoch 7120: Loss = 0.6606
Epoch 7120: Loss = 0.6541
Epoch 7120: Loss = 0.6716


 71%|███████▏  | 7132/10000 [09:31<04:12, 11.35it/s]

Epoch 7130: Loss = 0.6604
Epoch 7130: Loss = 0.6546
Epoch 7130: Loss = 0.6711
Epoch 7130: Loss = 0.6359
Epoch 7130: Loss = 0.6746


 71%|███████▏  | 7142/10000 [09:32<04:22, 10.88it/s]

Epoch 7140: Loss = 0.6913
Epoch 7140: Loss = 0.6684
Epoch 7140: Loss = 0.6479
Epoch 7140: Loss = 0.6963
Epoch 7140: Loss = 0.6797


 72%|███████▏  | 7152/10000 [09:32<03:41, 12.87it/s]

Epoch 7150: Loss = 0.6695
Epoch 7150: Loss = 0.6821
Epoch 7150: Loss = 0.6999
Epoch 7150: Loss = 0.6588
Epoch 7150: Loss = 0.6751


 72%|███████▏  | 7162/10000 [09:33<03:40, 12.89it/s]

Epoch 7160: Loss = 0.6655
Epoch 7160: Loss = 0.6696
Epoch 7160: Loss = 0.6857
Epoch 7160: Loss = 0.6702
Epoch 7160: Loss = 0.6712


 72%|███████▏  | 7172/10000 [09:34<03:27, 13.65it/s]

Epoch 7170: Loss = 0.6883
Epoch 7170: Loss = 0.6656
Epoch 7170: Loss = 0.6387
Epoch 7170: Loss = 0.6544
Epoch 7170: Loss = 0.6893


 72%|███████▏  | 7182/10000 [09:35<03:37, 12.99it/s]

Epoch 7180: Loss = 0.6729
Epoch 7180: Loss = 0.6700
Epoch 7180: Loss = 0.6697
Epoch 7180: Loss = 0.6473
Epoch 7180: Loss = 0.6709


 72%|███████▏  | 7192/10000 [09:35<03:23, 13.79it/s]

Epoch 7190: Loss = 0.6331
Epoch 7190: Loss = 0.7011
Epoch 7190: Loss = 0.6658
Epoch 7190: Loss = 0.6367
Epoch 7190: Loss = 0.6674


 72%|███████▏  | 7202/10000 [09:36<04:03, 11.48it/s]

Epoch 7200: Loss = 0.6724
Epoch 7200: Loss = 0.6624
Epoch 7200: Loss = 0.7039
Epoch 7200: Loss = 0.6716
Epoch 7200: Loss = 0.6436


 72%|███████▏  | 7212/10000 [09:37<03:37, 12.83it/s]

Epoch 7210: Loss = 0.6706
Epoch 7210: Loss = 0.6319
Epoch 7210: Loss = 0.6944
Epoch 7210: Loss = 0.6682
Epoch 7210: Loss = 0.6548


 72%|███████▏  | 7222/10000 [09:38<03:42, 12.51it/s]

Epoch 7220: Loss = 0.6963
Epoch 7220: Loss = 0.6919
Epoch 7220: Loss = 0.6852
Epoch 7220: Loss = 0.6279
Epoch 7220: Loss = 0.6435


 72%|███████▏  | 7232/10000 [09:39<03:41, 12.51it/s]

Epoch 7230: Loss = 0.6574
Epoch 7230: Loss = 0.6638
Epoch 7230: Loss = 0.6450
Epoch 7230: Loss = 0.6622
Epoch 7230: Loss = 0.6217


 72%|███████▏  | 7242/10000 [09:39<03:20, 13.77it/s]

Epoch 7240: Loss = 0.6661
Epoch 7240: Loss = 0.6600
Epoch 7240: Loss = 0.6778
Epoch 7240: Loss = 0.6681
Epoch 7240: Loss = 0.6370


 73%|███████▎  | 7252/10000 [09:40<03:20, 13.69it/s]

Epoch 7250: Loss = 0.6493
Epoch 7250: Loss = 0.6910
Epoch 7250: Loss = 0.6685
Epoch 7250: Loss = 0.6787
Epoch 7250: Loss = 0.6440


 73%|███████▎  | 7262/10000 [09:41<03:45, 12.15it/s]

Epoch 7260: Loss = 0.6517
Epoch 7260: Loss = 0.6748
Epoch 7260: Loss = 0.6848
Epoch 7260: Loss = 0.6416
Epoch 7260: Loss = 0.6744


 73%|███████▎  | 7272/10000 [09:42<03:17, 13.82it/s]

Epoch 7270: Loss = 0.6869
Epoch 7270: Loss = 0.6483
Epoch 7270: Loss = 0.6572
Epoch 7270: Loss = 0.6422
Epoch 7270: Loss = 0.6464


 73%|███████▎  | 7282/10000 [09:42<03:12, 14.14it/s]

Epoch 7280: Loss = 0.6558
Epoch 7280: Loss = 0.6741
Epoch 7280: Loss = 0.6576
Epoch 7280: Loss = 0.6730
Epoch 7280: Loss = 0.6819


 73%|███████▎  | 7292/10000 [09:43<03:25, 13.15it/s]

Epoch 7290: Loss = 0.6656
Epoch 7290: Loss = 0.6527
Epoch 7290: Loss = 0.6983
Epoch 7290: Loss = 0.6441
Epoch 7290: Loss = 0.6601


 73%|███████▎  | 7302/10000 [09:44<03:10, 14.17it/s]

Epoch 7300: Loss = 0.6424
Epoch 7300: Loss = 0.6860
Epoch 7300: Loss = 0.6727
Epoch 7300: Loss = 0.6856
Epoch 7300: Loss = 0.6399


 73%|███████▎  | 7312/10000 [09:45<03:17, 13.64it/s]

Epoch 7310: Loss = 0.6569
Epoch 7310: Loss = 0.6675
Epoch 7310: Loss = 0.6270
Epoch 7310: Loss = 0.6328
Epoch 7310: Loss = 0.6572


 73%|███████▎  | 7322/10000 [09:45<03:08, 14.22it/s]

Epoch 7320: Loss = 0.6840
Epoch 7320: Loss = 0.6791
Epoch 7320: Loss = 0.6783
Epoch 7320: Loss = 0.6841
Epoch 7320: Loss = 0.6685


 73%|███████▎  | 7332/10000 [09:46<03:17, 13.51it/s]

Epoch 7330: Loss = 0.6670
Epoch 7330: Loss = 0.6220
Epoch 7330: Loss = 0.6670
Epoch 7330: Loss = 0.6433
Epoch 7330: Loss = 0.6929


 73%|███████▎  | 7342/10000 [09:47<03:27, 12.81it/s]

Epoch 7340: Loss = 0.6883
Epoch 7340: Loss = 0.6775
Epoch 7340: Loss = 0.6831
Epoch 7340: Loss = 0.6950
Epoch 7340: Loss = 0.6649


 74%|███████▎  | 7352/10000 [09:48<03:38, 12.13it/s]

Epoch 7350: Loss = 0.6553
Epoch 7350: Loss = 0.6739
Epoch 7350: Loss = 0.6569
Epoch 7350: Loss = 0.6482
Epoch 7350: Loss = 0.6698


 74%|███████▎  | 7362/10000 [09:49<03:27, 12.70it/s]

Epoch 7360: Loss = 0.6832
Epoch 7360: Loss = 0.6538
Epoch 7360: Loss = 0.6722
Epoch 7360: Loss = 0.6661
Epoch 7360: Loss = 0.6778


 74%|███████▎  | 7372/10000 [09:49<03:18, 13.25it/s]

Epoch 7370: Loss = 0.6528
Epoch 7370: Loss = 0.6879
Epoch 7370: Loss = 0.6776
Epoch 7370: Loss = 0.6932
Epoch 7370: Loss = 0.6678


 74%|███████▍  | 7382/10000 [09:50<03:09, 13.85it/s]

Epoch 7380: Loss = 0.6637
Epoch 7380: Loss = 0.6958
Epoch 7380: Loss = 0.6918
Epoch 7380: Loss = 0.6814
Epoch 7380: Loss = 0.6675


 74%|███████▍  | 7392/10000 [09:51<03:11, 13.61it/s]

Epoch 7390: Loss = 0.6819
Epoch 7390: Loss = 0.6711
Epoch 7390: Loss = 0.6352
Epoch 7390: Loss = 0.6630
Epoch 7390: Loss = 0.6810


 74%|███████▍  | 7402/10000 [09:52<03:13, 13.45it/s]

Epoch 7400: Loss = 0.6397
Epoch 7400: Loss = 0.6667
Epoch 7400: Loss = 0.6822
Epoch 7400: Loss = 0.6487
Epoch 7400: Loss = 0.6675


 74%|███████▍  | 7412/10000 [09:52<03:22, 12.77it/s]

Epoch 7410: Loss = 0.6912
Epoch 7410: Loss = 0.6600
Epoch 7410: Loss = 0.6518
Epoch 7410: Loss = 0.6400
Epoch 7410: Loss = 0.6491


 74%|███████▍  | 7422/10000 [09:53<03:01, 14.18it/s]

Epoch 7420: Loss = 0.6860
Epoch 7420: Loss = 0.7054
Epoch 7420: Loss = 0.6676
Epoch 7420: Loss = 0.6869
Epoch 7420: Loss = 0.6493


 74%|███████▍  | 7432/10000 [09:54<03:27, 12.35it/s]

Epoch 7430: Loss = 0.6516
Epoch 7430: Loss = 0.6817
Epoch 7430: Loss = 0.6837
Epoch 7430: Loss = 0.6622
Epoch 7430: Loss = 0.6738


 74%|███████▍  | 7442/10000 [09:55<03:28, 12.28it/s]

Epoch 7440: Loss = 0.6475
Epoch 7440: Loss = 0.6976
Epoch 7440: Loss = 0.6798
Epoch 7440: Loss = 0.7004
Epoch 7440: Loss = 0.6537


 75%|███████▍  | 7452/10000 [09:55<03:02, 13.94it/s]

Epoch 7450: Loss = 0.6766
Epoch 7450: Loss = 0.6623
Epoch 7450: Loss = 0.6611
Epoch 7450: Loss = 0.6946
Epoch 7450: Loss = 0.6999


 75%|███████▍  | 7462/10000 [09:56<03:03, 13.86it/s]

Epoch 7460: Loss = 0.6532
Epoch 7460: Loss = 0.6605
Epoch 7460: Loss = 0.6680
Epoch 7460: Loss = 0.6589
Epoch 7460: Loss = 0.6563


 75%|███████▍  | 7472/10000 [09:57<03:26, 12.24it/s]

Epoch 7470: Loss = 0.6486
Epoch 7470: Loss = 0.6593
Epoch 7470: Loss = 0.6724
Epoch 7470: Loss = 0.6766
Epoch 7470: Loss = 0.6935


 75%|███████▍  | 7482/10000 [09:58<03:00, 13.93it/s]

Epoch 7480: Loss = 0.6465
Epoch 7480: Loss = 0.6524
Epoch 7480: Loss = 0.6826
Epoch 7480: Loss = 0.6840
Epoch 7480: Loss = 0.6755


 75%|███████▍  | 7492/10000 [09:58<02:53, 14.43it/s]

Epoch 7490: Loss = 0.6714
Epoch 7490: Loss = 0.6536
Epoch 7490: Loss = 0.6902
Epoch 7490: Loss = 0.6129
Epoch 7490: Loss = 0.6984


 75%|███████▌  | 7502/10000 [09:59<02:56, 14.11it/s]

Epoch 7500: Loss = 0.6675
Epoch 7500: Loss = 0.6627
Epoch 7500: Loss = 0.7032
Epoch 7500: Loss = 0.6708
Epoch 7500: Loss = 0.6436


 75%|███████▌  | 7512/10000 [10:00<03:03, 13.56it/s]

Epoch 7510: Loss = 0.6586
Epoch 7510: Loss = 0.6740
Epoch 7510: Loss = 0.6930
Epoch 7510: Loss = 0.6423
Epoch 7510: Loss = 0.6590


 75%|███████▌  | 7522/10000 [10:01<03:57, 10.45it/s]

Epoch 7520: Loss = 0.6336
Epoch 7520: Loss = 0.6935
Epoch 7520: Loss = 0.6277
Epoch 7520: Loss = 0.6703
Epoch 7520: Loss = 0.6800


 75%|███████▌  | 7532/10000 [10:02<03:14, 12.72it/s]

Epoch 7530: Loss = 0.6416
Epoch 7530: Loss = 0.6609
Epoch 7530: Loss = 0.6865
Epoch 7530: Loss = 0.6595
Epoch 7530: Loss = 0.6754


 75%|███████▌  | 7540/10000 [10:02<03:04, 13.36it/s]

Epoch 7540: Loss = 0.6673
Epoch 7540: Loss = 0.6628
Epoch 7540: Loss = 0.6629
Epoch 7540: Loss = 0.6629
Epoch 7540: Loss = 0.6459


 76%|███████▌  | 7552/10000 [10:03<03:09, 12.95it/s]

Epoch 7550: Loss = 0.6580
Epoch 7550: Loss = 0.7061
Epoch 7550: Loss = 0.6809
Epoch 7550: Loss = 0.6493
Epoch 7550: Loss = 0.6555


 76%|███████▌  | 7562/10000 [10:04<02:54, 13.97it/s]

Epoch 7560: Loss = 0.6512
Epoch 7560: Loss = 0.6699
Epoch 7560: Loss = 0.6831
Epoch 7560: Loss = 0.6502
Epoch 7560: Loss = 0.6643


 76%|███████▌  | 7572/10000 [10:05<03:13, 12.52it/s]

Epoch 7570: Loss = 0.6561
Epoch 7570: Loss = 0.6471
Epoch 7570: Loss = 0.6884
Epoch 7570: Loss = 0.6791
Epoch 7570: Loss = 0.6671


 76%|███████▌  | 7582/10000 [10:06<03:04, 13.12it/s]

Epoch 7580: Loss = 0.6742
Epoch 7580: Loss = 0.6460
Epoch 7580: Loss = 0.6697
Epoch 7580: Loss = 0.6709
Epoch 7580: Loss = 0.6832


 76%|███████▌  | 7592/10000 [10:06<03:04, 13.07it/s]

Epoch 7590: Loss = 0.6477
Epoch 7590: Loss = 0.6626
Epoch 7590: Loss = 0.6444
Epoch 7590: Loss = 0.6671
Epoch 7590: Loss = 0.6677


 76%|███████▌  | 7602/10000 [10:07<02:57, 13.51it/s]

Epoch 7600: Loss = 0.6498
Epoch 7600: Loss = 0.6678
Epoch 7600: Loss = 0.6846
Epoch 7600: Loss = 0.6608
Epoch 7600: Loss = 0.6888


 76%|███████▌  | 7610/10000 [10:08<03:05, 12.90it/s]

Epoch 7610: Loss = 0.6741
Epoch 7610: Loss = 0.6750
Epoch 7610: Loss = 0.6570
Epoch 7610: Loss = 0.6410
Epoch 7610: Loss = 0.6388


 76%|███████▌  | 7622/10000 [10:09<03:53, 10.18it/s]

Epoch 7620: Loss = 0.6936
Epoch 7620: Loss = 0.6504
Epoch 7620: Loss = 0.6807
Epoch 7620: Loss = 0.6469
Epoch 7620: Loss = 0.6828


 76%|███████▋  | 7632/10000 [10:10<03:25, 11.51it/s]

Epoch 7630: Loss = 0.6169
Epoch 7630: Loss = 0.6840
Epoch 7630: Loss = 0.6854
Epoch 7630: Loss = 0.6861
Epoch 7630: Loss = 0.6685


 76%|███████▋  | 7642/10000 [10:11<02:57, 13.25it/s]

Epoch 7640: Loss = 0.6774
Epoch 7640: Loss = 0.6658
Epoch 7640: Loss = 0.6592
Epoch 7640: Loss = 0.6715
Epoch 7640: Loss = 0.6882


 77%|███████▋  | 7652/10000 [10:12<03:26, 11.39it/s]

Epoch 7650: Loss = 0.6715
Epoch 7650: Loss = 0.6506
Epoch 7650: Loss = 0.6835
Epoch 7650: Loss = 0.6687
Epoch 7650: Loss = 0.6631


 77%|███████▋  | 7662/10000 [10:12<03:14, 12.02it/s]

Epoch 7660: Loss = 0.6435
Epoch 7660: Loss = 0.6522
Epoch 7660: Loss = 0.6426
Epoch 7660: Loss = 0.6673
Epoch 7660: Loss = 0.6563


 77%|███████▋  | 7672/10000 [10:13<02:50, 13.63it/s]

Epoch 7670: Loss = 0.6479
Epoch 7670: Loss = 0.6140
Epoch 7670: Loss = 0.7098
Epoch 7670: Loss = 0.6736
Epoch 7670: Loss = 0.6646


 77%|███████▋  | 7682/10000 [10:14<03:06, 12.44it/s]

Epoch 7680: Loss = 0.6662
Epoch 7680: Loss = 0.6564
Epoch 7680: Loss = 0.6970
Epoch 7680: Loss = 0.6276
Epoch 7680: Loss = 0.6619


 77%|███████▋  | 7692/10000 [10:15<02:49, 13.65it/s]

Epoch 7690: Loss = 0.6805
Epoch 7690: Loss = 0.6769
Epoch 7690: Loss = 0.6747
Epoch 7690: Loss = 0.6665
Epoch 7690: Loss = 0.6817


 77%|███████▋  | 7702/10000 [10:15<02:58, 12.90it/s]

Epoch 7700: Loss = 0.6588
Epoch 7700: Loss = 0.6945
Epoch 7700: Loss = 0.6582
Epoch 7700: Loss = 0.6982
Epoch 7700: Loss = 0.6727


 77%|███████▋  | 7712/10000 [10:16<02:44, 13.91it/s]

Epoch 7710: Loss = 0.6603
Epoch 7710: Loss = 0.6702
Epoch 7710: Loss = 0.6439
Epoch 7710: Loss = 0.6967
Epoch 7710: Loss = 0.6989


 77%|███████▋  | 7722/10000 [10:17<02:42, 13.99it/s]

Epoch 7720: Loss = 0.6416
Epoch 7720: Loss = 0.6400
Epoch 7720: Loss = 0.6432
Epoch 7720: Loss = 0.6533
Epoch 7720: Loss = 0.6386


 77%|███████▋  | 7732/10000 [10:18<02:59, 12.67it/s]

Epoch 7730: Loss = 0.6643
Epoch 7730: Loss = 0.6955
Epoch 7730: Loss = 0.7110
Epoch 7730: Loss = 0.6915
Epoch 7730: Loss = 0.6495


 77%|███████▋  | 7742/10000 [10:18<02:59, 12.59it/s]

Epoch 7740: Loss = 0.6491
Epoch 7740: Loss = 0.7252
Epoch 7740: Loss = 0.6687
Epoch 7740: Loss = 0.6726
Epoch 7740: Loss = 0.6350


 78%|███████▊  | 7752/10000 [10:19<03:07, 11.98it/s]

Epoch 7750: Loss = 0.6780
Epoch 7750: Loss = 0.6700
Epoch 7750: Loss = 0.6557
Epoch 7750: Loss = 0.6629
Epoch 7750: Loss = 0.6503


 78%|███████▊  | 7762/10000 [10:20<03:05, 12.05it/s]

Epoch 7760: Loss = 0.6633
Epoch 7760: Loss = 0.6433
Epoch 7760: Loss = 0.6759
Epoch 7760: Loss = 0.6784
Epoch 7760: Loss = 0.6482


 78%|███████▊  | 7772/10000 [10:21<02:45, 13.48it/s]

Epoch 7770: Loss = 0.6670
Epoch 7770: Loss = 0.6622
Epoch 7770: Loss = 0.6720
Epoch 7770: Loss = 0.6633
Epoch 7770: Loss = 0.6552


 78%|███████▊  | 7782/10000 [10:22<03:00, 12.28it/s]

Epoch 7780: Loss = 0.6706
Epoch 7780: Loss = 0.6629
Epoch 7780: Loss = 0.6360
Epoch 7780: Loss = 0.6467
Epoch 7780: Loss = 0.6566


 78%|███████▊  | 7792/10000 [10:22<02:54, 12.63it/s]

Epoch 7790: Loss = 0.6779
Epoch 7790: Loss = 0.6534
Epoch 7790: Loss = 0.6894
Epoch 7790: Loss = 0.6441
Epoch 7790: Loss = 0.6807


 78%|███████▊  | 7802/10000 [10:23<02:52, 12.75it/s]

Epoch 7800: Loss = 0.6809
Epoch 7800: Loss = 0.6947
Epoch 7800: Loss = 0.6573
Epoch 7800: Loss = 0.6142
Epoch 7800: Loss = 0.6907


 78%|███████▊  | 7812/10000 [10:24<02:41, 13.53it/s]

Epoch 7810: Loss = 0.6474
Epoch 7810: Loss = 0.6627
Epoch 7810: Loss = 0.6422
Epoch 7810: Loss = 0.6675
Epoch 7810: Loss = 0.6406


 78%|███████▊  | 7822/10000 [10:25<02:58, 12.21it/s]

Epoch 7820: Loss = 0.6283
Epoch 7820: Loss = 0.6916
Epoch 7820: Loss = 0.6550
Epoch 7820: Loss = 0.6966
Epoch 7820: Loss = 0.6470


 78%|███████▊  | 7832/10000 [10:26<02:36, 13.81it/s]

Epoch 7830: Loss = 0.6437
Epoch 7830: Loss = 0.6772
Epoch 7830: Loss = 0.6472
Epoch 7830: Loss = 0.6838
Epoch 7830: Loss = 0.6345


 78%|███████▊  | 7842/10000 [10:26<02:38, 13.65it/s]

Epoch 7840: Loss = 0.6851
Epoch 7840: Loss = 0.6342
Epoch 7840: Loss = 0.6829
Epoch 7840: Loss = 0.6914
Epoch 7840: Loss = 0.6216


 79%|███████▊  | 7852/10000 [10:27<02:32, 14.08it/s]

Epoch 7850: Loss = 0.6362
Epoch 7850: Loss = 0.7038
Epoch 7850: Loss = 0.6782
Epoch 7850: Loss = 0.6671
Epoch 7850: Loss = 0.6667


 79%|███████▊  | 7862/10000 [10:28<02:40, 13.30it/s]

Epoch 7860: Loss = 0.6737
Epoch 7860: Loss = 0.6759
Epoch 7860: Loss = 0.6704
Epoch 7860: Loss = 0.6959
Epoch 7860: Loss = 0.6535


 79%|███████▊  | 7872/10000 [10:29<02:43, 12.98it/s]

Epoch 7870: Loss = 0.6365
Epoch 7870: Loss = 0.6436
Epoch 7870: Loss = 0.6860
Epoch 7870: Loss = 0.6644
Epoch 7870: Loss = 0.6530


 79%|███████▉  | 7882/10000 [10:29<02:29, 14.12it/s]

Epoch 7880: Loss = 0.6828
Epoch 7880: Loss = 0.6653
Epoch 7880: Loss = 0.6741
Epoch 7880: Loss = 0.6595
Epoch 7880: Loss = 0.6941


 79%|███████▉  | 7892/10000 [10:30<02:45, 12.77it/s]

Epoch 7890: Loss = 0.6638
Epoch 7890: Loss = 0.6585
Epoch 7890: Loss = 0.6489
Epoch 7890: Loss = 0.6731
Epoch 7890: Loss = 0.6537


 79%|███████▉  | 7902/10000 [10:31<02:38, 13.26it/s]

Epoch 7900: Loss = 0.6840
Epoch 7900: Loss = 0.6607
Epoch 7900: Loss = 0.6809
Epoch 7900: Loss = 0.6852
Epoch 7900: Loss = 0.6689


 79%|███████▉  | 7912/10000 [10:32<02:36, 13.35it/s]

Epoch 7910: Loss = 0.6653
Epoch 7910: Loss = 0.6567
Epoch 7910: Loss = 0.6522
Epoch 7910: Loss = 0.6911
Epoch 7910: Loss = 0.6763


 79%|███████▉  | 7922/10000 [10:32<02:28, 14.02it/s]

Epoch 7920: Loss = 0.6751
Epoch 7920: Loss = 0.6655
Epoch 7920: Loss = 0.6817
Epoch 7920: Loss = 0.6820
Epoch 7920: Loss = 0.6778


 79%|███████▉  | 7932/10000 [10:33<02:35, 13.28it/s]

Epoch 7930: Loss = 0.6642
Epoch 7930: Loss = 0.6813
Epoch 7930: Loss = 0.6585
Epoch 7930: Loss = 0.6937
Epoch 7930: Loss = 0.6405


 79%|███████▉  | 7942/10000 [10:34<02:40, 12.80it/s]

Epoch 7940: Loss = 0.6456
Epoch 7940: Loss = 0.6723
Epoch 7940: Loss = 0.6812
Epoch 7940: Loss = 0.6756
Epoch 7940: Loss = 0.6900


 80%|███████▉  | 7952/10000 [10:35<02:31, 13.56it/s]

Epoch 7950: Loss = 0.6494
Epoch 7950: Loss = 0.6751
Epoch 7950: Loss = 0.6418
Epoch 7950: Loss = 0.6582
Epoch 7950: Loss = 0.6121


 80%|███████▉  | 7962/10000 [10:36<02:54, 11.68it/s]

Epoch 7960: Loss = 0.6810
Epoch 7960: Loss = 0.6703
Epoch 7960: Loss = 0.6570
Epoch 7960: Loss = 0.6619
Epoch 7960: Loss = 0.6552


 80%|███████▉  | 7972/10000 [10:36<02:46, 12.20it/s]

Epoch 7970: Loss = 0.6787
Epoch 7970: Loss = 0.6487
Epoch 7970: Loss = 0.6786
Epoch 7970: Loss = 0.6483
Epoch 7970: Loss = 0.6492


 80%|███████▉  | 7982/10000 [10:37<02:32, 13.27it/s]

Epoch 7980: Loss = 0.6848
Epoch 7980: Loss = 0.6677
Epoch 7980: Loss = 0.6593
Epoch 7980: Loss = 0.6827
Epoch 7980: Loss = 0.6500


 80%|███████▉  | 7992/10000 [10:38<02:25, 13.82it/s]

Epoch 7990: Loss = 0.6631
Epoch 7990: Loss = 0.6550
Epoch 7990: Loss = 0.6510
Epoch 7990: Loss = 0.6614
Epoch 7990: Loss = 0.6493


 80%|████████  | 8002/10000 [10:39<02:36, 12.78it/s]

Epoch 8000: Loss = 0.6937
Epoch 8000: Loss = 0.6789
Epoch 8000: Loss = 0.6521
Epoch 8000: Loss = 0.6643
Epoch 8000: Loss = 0.6569


 80%|████████  | 8012/10000 [10:40<02:27, 13.44it/s]

Epoch 8010: Loss = 0.6732
Epoch 8010: Loss = 0.6722
Epoch 8010: Loss = 0.6427
Epoch 8010: Loss = 0.6654
Epoch 8010: Loss = 0.6197


 80%|████████  | 8022/10000 [10:40<02:21, 13.94it/s]

Epoch 8020: Loss = 0.6750
Epoch 8020: Loss = 0.6771
Epoch 8020: Loss = 0.6741
Epoch 8020: Loss = 0.6542
Epoch 8020: Loss = 0.6598


 80%|████████  | 8032/10000 [10:41<02:27, 13.31it/s]

Epoch 8030: Loss = 0.6803
Epoch 8030: Loss = 0.6436
Epoch 8030: Loss = 0.6486
Epoch 8030: Loss = 0.6487
Epoch 8030: Loss = 0.6722


 80%|████████  | 8042/10000 [10:42<02:25, 13.48it/s]

Epoch 8040: Loss = 0.6788
Epoch 8040: Loss = 0.6809
Epoch 8040: Loss = 0.6621
Epoch 8040: Loss = 0.6201
Epoch 8040: Loss = 0.6697


 81%|████████  | 8052/10000 [10:43<02:17, 14.15it/s]

Epoch 8050: Loss = 0.6448
Epoch 8050: Loss = 0.6517
Epoch 8050: Loss = 0.6591
Epoch 8050: Loss = 0.6515
Epoch 8050: Loss = 0.6819


 81%|████████  | 8062/10000 [10:43<02:17, 14.10it/s]

Epoch 8060: Loss = 0.6685
Epoch 8060: Loss = 0.6441
Epoch 8060: Loss = 0.6647
Epoch 8060: Loss = 0.7122
Epoch 8060: Loss = 0.6874


 81%|████████  | 8072/10000 [10:44<02:16, 14.14it/s]

Epoch 8070: Loss = 0.6465
Epoch 8070: Loss = 0.7090
Epoch 8070: Loss = 0.6658
Epoch 8070: Loss = 0.6649
Epoch 8070: Loss = 0.6970


 81%|████████  | 8082/10000 [10:45<02:25, 13.20it/s]

Epoch 8080: Loss = 0.6864
Epoch 8080: Loss = 0.6632
Epoch 8080: Loss = 0.6740
Epoch 8080: Loss = 0.7260
Epoch 8080: Loss = 0.6411


 81%|████████  | 8092/10000 [10:45<02:16, 13.98it/s]

Epoch 8090: Loss = 0.6650
Epoch 8090: Loss = 0.6660
Epoch 8090: Loss = 0.6677
Epoch 8090: Loss = 0.6715
Epoch 8090: Loss = 0.6555


 81%|████████  | 8102/10000 [10:46<02:23, 13.22it/s]

Epoch 8100: Loss = 0.6803
Epoch 8100: Loss = 0.6877
Epoch 8100: Loss = 0.6805
Epoch 8100: Loss = 0.6538
Epoch 8100: Loss = 0.6622


 81%|████████  | 8112/10000 [10:47<02:22, 13.28it/s]

Epoch 8110: Loss = 0.6627
Epoch 8110: Loss = 0.6432
Epoch 8110: Loss = 0.6659
Epoch 8110: Loss = 0.6859
Epoch 8110: Loss = 0.7207


 81%|████████  | 8122/10000 [10:48<02:17, 13.65it/s]

Epoch 8120: Loss = 0.6517
Epoch 8120: Loss = 0.6352
Epoch 8120: Loss = 0.6903
Epoch 8120: Loss = 0.6589
Epoch 8120: Loss = 0.6709


 81%|████████▏ | 8132/10000 [10:48<02:22, 13.13it/s]

Epoch 8130: Loss = 0.6703
Epoch 8130: Loss = 0.6718
Epoch 8130: Loss = 0.6577
Epoch 8130: Loss = 0.6493
Epoch 8130: Loss = 0.6430


 81%|████████▏ | 8142/10000 [10:49<02:15, 13.76it/s]

Epoch 8140: Loss = 0.6541
Epoch 8140: Loss = 0.6822
Epoch 8140: Loss = 0.6592
Epoch 8140: Loss = 0.6496
Epoch 8140: Loss = 0.6317


 82%|████████▏ | 8152/10000 [10:50<02:15, 13.63it/s]

Epoch 8150: Loss = 0.6799
Epoch 8150: Loss = 0.6706
Epoch 8150: Loss = 0.6801
Epoch 8150: Loss = 0.6697
Epoch 8150: Loss = 0.6645


 82%|████████▏ | 8162/10000 [10:51<02:39, 11.52it/s]

Epoch 8160: Loss = 0.6550
Epoch 8160: Loss = 0.6780
Epoch 8160: Loss = 0.7009
Epoch 8160: Loss = 0.6546
Epoch 8160: Loss = 0.6878


 82%|████████▏ | 8172/10000 [10:52<02:26, 12.48it/s]

Epoch 8170: Loss = 0.6631
Epoch 8170: Loss = 0.6744
Epoch 8170: Loss = 0.6698
Epoch 8170: Loss = 0.6862
Epoch 8170: Loss = 0.6712


 82%|████████▏ | 8182/10000 [10:52<02:18, 13.17it/s]

Epoch 8180: Loss = 0.6745
Epoch 8180: Loss = 0.6578
Epoch 8180: Loss = 0.6265
Epoch 8180: Loss = 0.6757
Epoch 8180: Loss = 0.6831


 82%|████████▏ | 8192/10000 [10:53<02:10, 13.87it/s]

Epoch 8190: Loss = 0.6556
Epoch 8190: Loss = 0.6422
Epoch 8190: Loss = 0.6780
Epoch 8190: Loss = 0.6811
Epoch 8190: Loss = 0.6752


 82%|████████▏ | 8202/10000 [10:54<02:08, 13.97it/s]

Epoch 8200: Loss = 0.6916
Epoch 8200: Loss = 0.6801
Epoch 8200: Loss = 0.6520
Epoch 8200: Loss = 0.6140
Epoch 8200: Loss = 0.6478


 82%|████████▏ | 8212/10000 [10:55<02:08, 13.91it/s]

Epoch 8210: Loss = 0.6335
Epoch 8210: Loss = 0.6494
Epoch 8210: Loss = 0.6784
Epoch 8210: Loss = 0.6437
Epoch 8210: Loss = 0.6779


 82%|████████▏ | 8222/10000 [10:55<02:35, 11.42it/s]

Epoch 8220: Loss = 0.6622
Epoch 8220: Loss = 0.6514
Epoch 8220: Loss = 0.6495
Epoch 8220: Loss = 0.6412
Epoch 8220: Loss = 0.6996


 82%|████████▏ | 8232/10000 [10:56<02:34, 11.41it/s]

Epoch 8230: Loss = 0.6715
Epoch 8230: Loss = 0.6461
Epoch 8230: Loss = 0.6431
Epoch 8230: Loss = 0.6648
Epoch 8230: Loss = 0.6862


 82%|████████▏ | 8242/10000 [10:57<02:20, 12.53it/s]

Epoch 8240: Loss = 0.6853
Epoch 8240: Loss = 0.6597
Epoch 8240: Loss = 0.6459
Epoch 8240: Loss = 0.6973
Epoch 8240: Loss = 0.6805


 83%|████████▎ | 8252/10000 [10:58<02:26, 11.93it/s]

Epoch 8250: Loss = 0.6726
Epoch 8250: Loss = 0.6644
Epoch 8250: Loss = 0.6785
Epoch 8250: Loss = 0.6355
Epoch 8250: Loss = 0.6831


 83%|████████▎ | 8262/10000 [10:59<02:32, 11.36it/s]

Epoch 8260: Loss = 0.6532
Epoch 8260: Loss = 0.6391
Epoch 8260: Loss = 0.6584
Epoch 8260: Loss = 0.6226
Epoch 8260: Loss = 0.6912


 83%|████████▎ | 8272/10000 [11:00<02:14, 12.84it/s]

Epoch 8270: Loss = 0.6892
Epoch 8270: Loss = 0.6701
Epoch 8270: Loss = 0.6691
Epoch 8270: Loss = 0.6809
Epoch 8270: Loss = 0.6793


 83%|████████▎ | 8282/10000 [11:00<02:04, 13.79it/s]

Epoch 8280: Loss = 0.6511
Epoch 8280: Loss = 0.6693
Epoch 8280: Loss = 0.6538
Epoch 8280: Loss = 0.6423
Epoch 8280: Loss = 0.6490


 83%|████████▎ | 8292/10000 [11:01<02:06, 13.49it/s]

Epoch 8290: Loss = 0.7085
Epoch 8290: Loss = 0.6494
Epoch 8290: Loss = 0.6606
Epoch 8290: Loss = 0.6681
Epoch 8290: Loss = 0.6502


 83%|████████▎ | 8302/10000 [11:02<02:05, 13.58it/s]

Epoch 8300: Loss = 0.6629
Epoch 8300: Loss = 0.6603
Epoch 8300: Loss = 0.6760
Epoch 8300: Loss = 0.6471
Epoch 8300: Loss = 0.6687


 83%|████████▎ | 8312/10000 [11:03<02:27, 11.47it/s]

Epoch 8310: Loss = 0.6761
Epoch 8310: Loss = 0.6650
Epoch 8310: Loss = 0.6799
Epoch 8310: Loss = 0.6359
Epoch 8310: Loss = 0.6297


 83%|████████▎ | 8322/10000 [11:04<02:30, 11.16it/s]

Epoch 8320: Loss = 0.6729
Epoch 8320: Loss = 0.6497
Epoch 8320: Loss = 0.6627
Epoch 8320: Loss = 0.6300
Epoch 8320: Loss = 0.6623


 83%|████████▎ | 8332/10000 [11:05<02:27, 11.29it/s]

Epoch 8330: Loss = 0.6546
Epoch 8330: Loss = 0.6451
Epoch 8330: Loss = 0.6939
Epoch 8330: Loss = 0.6937
Epoch 8330: Loss = 0.6318


 83%|████████▎ | 8342/10000 [11:05<02:05, 13.23it/s]

Epoch 8340: Loss = 0.6668
Epoch 8340: Loss = 0.7242
Epoch 8340: Loss = 0.6797
Epoch 8340: Loss = 0.6564
Epoch 8340: Loss = 0.6523


 84%|████████▎ | 8352/10000 [11:06<02:04, 13.19it/s]

Epoch 8350: Loss = 0.6587
Epoch 8350: Loss = 0.6790
Epoch 8350: Loss = 0.6484
Epoch 8350: Loss = 0.6535
Epoch 8350: Loss = 0.6780


 84%|████████▎ | 8362/10000 [11:07<02:22, 11.51it/s]

Epoch 8360: Loss = 0.6948
Epoch 8360: Loss = 0.6883
Epoch 8360: Loss = 0.6838
Epoch 8360: Loss = 0.6457
Epoch 8360: Loss = 0.6624


 84%|████████▎ | 8372/10000 [11:08<02:40, 10.14it/s]

Epoch 8370: Loss = 0.6710
Epoch 8370: Loss = 0.6355
Epoch 8370: Loss = 0.6513
Epoch 8370: Loss = 0.6690
Epoch 8370: Loss = 0.6519


 84%|████████▍ | 8382/10000 [11:09<02:04, 13.00it/s]

Epoch 8380: Loss = 0.6614
Epoch 8380: Loss = 0.6577
Epoch 8380: Loss = 0.6448
Epoch 8380: Loss = 0.6700
Epoch 8380: Loss = 0.6381


 84%|████████▍ | 8392/10000 [11:09<01:57, 13.65it/s]

Epoch 8390: Loss = 0.6742
Epoch 8390: Loss = 0.6455
Epoch 8390: Loss = 0.6912
Epoch 8390: Loss = 0.6358
Epoch 8390: Loss = 0.6701


 84%|████████▍ | 8402/10000 [11:10<02:02, 13.04it/s]

Epoch 8400: Loss = 0.6529
Epoch 8400: Loss = 0.6630
Epoch 8400: Loss = 0.6453
Epoch 8400: Loss = 0.6688
Epoch 8400: Loss = 0.6711


 84%|████████▍ | 8412/10000 [11:11<01:54, 13.81it/s]

Epoch 8410: Loss = 0.6449
Epoch 8410: Loss = 0.6312
Epoch 8410: Loss = 0.6637
Epoch 8410: Loss = 0.6186
Epoch 8410: Loss = 0.6609


 84%|████████▍ | 8422/10000 [11:12<01:52, 13.98it/s]

Epoch 8420: Loss = 0.6647
Epoch 8420: Loss = 0.6822
Epoch 8420: Loss = 0.6815
Epoch 8420: Loss = 0.6725
Epoch 8420: Loss = 0.6355


 84%|████████▍ | 8432/10000 [11:13<02:08, 12.18it/s]

Epoch 8430: Loss = 0.6481
Epoch 8430: Loss = 0.6798
Epoch 8430: Loss = 0.6718
Epoch 8430: Loss = 0.6522
Epoch 8430: Loss = 0.6726


 84%|████████▍ | 8442/10000 [11:13<02:03, 12.62it/s]

Epoch 8440: Loss = 0.6780
Epoch 8440: Loss = 0.7018
Epoch 8440: Loss = 0.6961
Epoch 8440: Loss = 0.6294
Epoch 8440: Loss = 0.6950


 85%|████████▍ | 8452/10000 [11:14<01:59, 12.93it/s]

Epoch 8450: Loss = 0.6274
Epoch 8450: Loss = 0.6463
Epoch 8450: Loss = 0.6587
Epoch 8450: Loss = 0.6468
Epoch 8450: Loss = 0.6666


 85%|████████▍ | 8462/10000 [11:15<01:51, 13.81it/s]

Epoch 8460: Loss = 0.7106
Epoch 8460: Loss = 0.6730
Epoch 8460: Loss = 0.6675
Epoch 8460: Loss = 0.6761
Epoch 8460: Loss = 0.6808


 85%|████████▍ | 8472/10000 [11:16<02:02, 12.48it/s]

Epoch 8470: Loss = 0.6871
Epoch 8470: Loss = 0.6581
Epoch 8470: Loss = 0.6371
Epoch 8470: Loss = 0.6537
Epoch 8470: Loss = 0.6588


 85%|████████▍ | 8482/10000 [11:17<02:13, 11.35it/s]

Epoch 8480: Loss = 0.6778
Epoch 8480: Loss = 0.6905
Epoch 8480: Loss = 0.6638
Epoch 8480: Loss = 0.6288
Epoch 8480: Loss = 0.6428


 85%|████████▍ | 8492/10000 [11:17<01:58, 12.74it/s]

Epoch 8490: Loss = 0.6626
Epoch 8490: Loss = 0.6535
Epoch 8490: Loss = 0.6695
Epoch 8490: Loss = 0.6566
Epoch 8490: Loss = 0.6774


 85%|████████▌ | 8502/10000 [11:18<01:48, 13.80it/s]

Epoch 8500: Loss = 0.6746
Epoch 8500: Loss = 0.6477
Epoch 8500: Loss = 0.6857
Epoch 8500: Loss = 0.6698
Epoch 8500: Loss = 0.6854


 85%|████████▌ | 8512/10000 [11:19<02:01, 12.22it/s]

Epoch 8510: Loss = 0.6721
Epoch 8510: Loss = 0.6707
Epoch 8510: Loss = 0.6585
Epoch 8510: Loss = 0.6566
Epoch 8510: Loss = 0.6970


 85%|████████▌ | 8522/10000 [11:20<01:48, 13.64it/s]

Epoch 8520: Loss = 0.6730
Epoch 8520: Loss = 0.6758
Epoch 8520: Loss = 0.6302
Epoch 8520: Loss = 0.6563
Epoch 8520: Loss = 0.6391


 85%|████████▌ | 8532/10000 [11:20<01:47, 13.64it/s]

Epoch 8530: Loss = 0.6712
Epoch 8530: Loss = 0.6560
Epoch 8530: Loss = 0.6897
Epoch 8530: Loss = 0.6579
Epoch 8530: Loss = 0.6627


 85%|████████▌ | 8542/10000 [11:21<01:48, 13.45it/s]

Epoch 8540: Loss = 0.6146
Epoch 8540: Loss = 0.6432
Epoch 8540: Loss = 0.6823
Epoch 8540: Loss = 0.6372
Epoch 8540: Loss = 0.7004


 86%|████████▌ | 8552/10000 [11:22<01:48, 13.37it/s]

Epoch 8550: Loss = 0.6479
Epoch 8550: Loss = 0.6808
Epoch 8550: Loss = 0.6509
Epoch 8550: Loss = 0.6705
Epoch 8550: Loss = 0.6602


 86%|████████▌ | 8562/10000 [11:23<01:50, 12.99it/s]

Epoch 8560: Loss = 0.6891
Epoch 8560: Loss = 0.6355
Epoch 8560: Loss = 0.6472
Epoch 8560: Loss = 0.6726
Epoch 8560: Loss = 0.6559


 86%|████████▌ | 8570/10000 [11:24<02:28,  9.62it/s]

Epoch 8570: Loss = 0.6626
Epoch 8570: Loss = 0.6724
Epoch 8570: Loss = 0.6473
Epoch 8570: Loss = 0.7064
Epoch 8570: Loss = 0.6630


 86%|████████▌ | 8581/10000 [11:25<02:12, 10.75it/s]

Epoch 8580: Loss = 0.6726
Epoch 8580: Loss = 0.6646
Epoch 8580: Loss = 0.6283
Epoch 8580: Loss = 0.6809
Epoch 8580: Loss = 0.6810


 86%|████████▌ | 8593/10000 [11:25<01:44, 13.41it/s]

Epoch 8590: Loss = 0.6361
Epoch 8590: Loss = 0.6777
Epoch 8590: Loss = 0.6532
Epoch 8590: Loss = 0.6581
Epoch 8590: Loss = 0.6526


 86%|████████▌ | 8601/10000 [11:26<01:59, 11.74it/s]

Epoch 8600: Loss = 0.6456
Epoch 8600: Loss = 0.6595
Epoch 8600: Loss = 0.6975
Epoch 8600: Loss = 0.6805
Epoch 8600: Loss = 0.6753


 86%|████████▌ | 8611/10000 [11:27<01:45, 13.22it/s]

Epoch 8610: Loss = 0.6965
Epoch 8610: Loss = 0.6684
Epoch 8610: Loss = 0.6832
Epoch 8610: Loss = 0.6257
Epoch 8610: Loss = 0.6631


 86%|████████▌ | 8623/10000 [11:28<01:48, 12.66it/s]

Epoch 8620: Loss = 0.6611
Epoch 8620: Loss = 0.6258
Epoch 8620: Loss = 0.6707
Epoch 8620: Loss = 0.6814
Epoch 8620: Loss = 0.6547


 86%|████████▋ | 8633/10000 [11:29<01:42, 13.34it/s]

Epoch 8630: Loss = 0.6637
Epoch 8630: Loss = 0.6406
Epoch 8630: Loss = 0.6922
Epoch 8630: Loss = 0.6603
Epoch 8630: Loss = 0.6386


 86%|████████▋ | 8643/10000 [11:29<01:39, 13.67it/s]

Epoch 8640: Loss = 0.6612
Epoch 8640: Loss = 0.6807
Epoch 8640: Loss = 0.6697
Epoch 8640: Loss = 0.6637
Epoch 8640: Loss = 0.6501


 87%|████████▋ | 8653/10000 [11:30<01:37, 13.77it/s]

Epoch 8650: Loss = 0.6538
Epoch 8650: Loss = 0.7016
Epoch 8650: Loss = 0.6987
Epoch 8650: Loss = 0.6529
Epoch 8650: Loss = 0.6600


 87%|████████▋ | 8661/10000 [11:31<01:38, 13.62it/s]

Epoch 8660: Loss = 0.6252
Epoch 8660: Loss = 0.6494
Epoch 8660: Loss = 0.6553
Epoch 8660: Loss = 0.6752
Epoch 8660: Loss = 0.6884


 87%|████████▋ | 8671/10000 [11:32<01:37, 13.65it/s]

Epoch 8670: Loss = 0.6656
Epoch 8670: Loss = 0.6522
Epoch 8670: Loss = 0.6768
Epoch 8670: Loss = 0.6321
Epoch 8670: Loss = 0.6990


 87%|████████▋ | 8683/10000 [11:32<01:37, 13.55it/s]

Epoch 8680: Loss = 0.6934
Epoch 8680: Loss = 0.6634
Epoch 8680: Loss = 0.6304
Epoch 8680: Loss = 0.6831
Epoch 8680: Loss = 0.6468


 87%|████████▋ | 8691/10000 [11:33<01:50, 11.87it/s]

Epoch 8690: Loss = 0.6669
Epoch 8690: Loss = 0.6914
Epoch 8690: Loss = 0.6913
Epoch 8690: Loss = 0.6722
Epoch 8690: Loss = 0.7106


 87%|████████▋ | 8703/10000 [11:34<01:43, 12.48it/s]

Epoch 8700: Loss = 0.6513
Epoch 8700: Loss = 0.6810
Epoch 8700: Loss = 0.6754
Epoch 8700: Loss = 0.6957
Epoch 8700: Loss = 0.7059


 87%|████████▋ | 8713/10000 [11:35<01:43, 12.44it/s]

Epoch 8710: Loss = 0.6663
Epoch 8710: Loss = 0.6236
Epoch 8710: Loss = 0.6595
Epoch 8710: Loss = 0.6679
Epoch 8710: Loss = 0.6679


 87%|████████▋ | 8721/10000 [11:36<01:39, 12.91it/s]

Epoch 8720: Loss = 0.6361
Epoch 8720: Loss = 0.6743
Epoch 8720: Loss = 0.6788
Epoch 8720: Loss = 0.6471
Epoch 8720: Loss = 0.6621


 87%|████████▋ | 8731/10000 [11:37<01:39, 12.79it/s]

Epoch 8730: Loss = 0.6634
Epoch 8730: Loss = 0.6966
Epoch 8730: Loss = 0.6448
Epoch 8730: Loss = 0.6778
Epoch 8730: Loss = 0.6711


 87%|████████▋ | 8743/10000 [11:37<01:33, 13.44it/s]

Epoch 8740: Loss = 0.6791
Epoch 8740: Loss = 0.6476
Epoch 8740: Loss = 0.6794
Epoch 8740: Loss = 0.6587
Epoch 8740: Loss = 0.6544


 88%|████████▊ | 8753/10000 [11:38<01:29, 14.00it/s]

Epoch 8750: Loss = 0.6258
Epoch 8750: Loss = 0.6316
Epoch 8750: Loss = 0.6607
Epoch 8750: Loss = 0.6590
Epoch 8750: Loss = 0.6358


 88%|████████▊ | 8761/10000 [11:39<01:28, 13.96it/s]

Epoch 8760: Loss = 0.6548
Epoch 8760: Loss = 0.6530
Epoch 8760: Loss = 0.6548
Epoch 8760: Loss = 0.6656
Epoch 8760: Loss = 0.6820


 88%|████████▊ | 8771/10000 [11:40<01:40, 12.24it/s]

Epoch 8770: Loss = 0.6503
Epoch 8770: Loss = 0.6321
Epoch 8770: Loss = 0.6690
Epoch 8770: Loss = 0.6173
Epoch 8770: Loss = 0.6432


 88%|████████▊ | 8783/10000 [11:41<01:35, 12.79it/s]

Epoch 8780: Loss = 0.6406
Epoch 8780: Loss = 0.6867
Epoch 8780: Loss = 0.6421
Epoch 8780: Loss = 0.6442
Epoch 8780: Loss = 0.6477


 88%|████████▊ | 8791/10000 [11:41<01:50, 10.95it/s]

Epoch 8790: Loss = 0.6368
Epoch 8790: Loss = 0.6387
Epoch 8790: Loss = 0.6915
Epoch 8790: Loss = 0.6853
Epoch 8790: Loss = 0.6848


 88%|████████▊ | 8803/10000 [11:42<01:29, 13.39it/s]

Epoch 8800: Loss = 0.6572
Epoch 8800: Loss = 0.6846
Epoch 8800: Loss = 0.6492
Epoch 8800: Loss = 0.6669
Epoch 8800: Loss = 0.6380


 88%|████████▊ | 8811/10000 [11:43<01:37, 12.20it/s]

Epoch 8810: Loss = 0.7051
Epoch 8810: Loss = 0.6783
Epoch 8810: Loss = 0.6603
Epoch 8810: Loss = 0.6583
Epoch 8810: Loss = 0.6655


 88%|████████▊ | 8821/10000 [11:44<01:43, 11.40it/s]

Epoch 8820: Loss = 0.6901
Epoch 8820: Loss = 0.6669
Epoch 8820: Loss = 0.6832
Epoch 8820: Loss = 0.6661
Epoch 8820: Loss = 0.6591


 88%|████████▊ | 8831/10000 [11:45<01:40, 11.68it/s]

Epoch 8830: Loss = 0.6673
Epoch 8830: Loss = 0.6683
Epoch 8830: Loss = 0.6668
Epoch 8830: Loss = 0.6683
Epoch 8830: Loss = 0.6395


 88%|████████▊ | 8843/10000 [11:46<01:28, 13.11it/s]

Epoch 8840: Loss = 0.6574
Epoch 8840: Loss = 0.6914
Epoch 8840: Loss = 0.6794
Epoch 8840: Loss = 0.6444
Epoch 8840: Loss = 0.6799


 89%|████████▊ | 8851/10000 [11:46<01:32, 12.37it/s]

Epoch 8850: Loss = 0.6974
Epoch 8850: Loss = 0.6628
Epoch 8850: Loss = 0.6702
Epoch 8850: Loss = 0.6508
Epoch 8850: Loss = 0.6451


 89%|████████▊ | 8861/10000 [11:47<01:32, 12.27it/s]

Epoch 8860: Loss = 0.6797
Epoch 8860: Loss = 0.6585
Epoch 8860: Loss = 0.6333
Epoch 8860: Loss = 0.6619
Epoch 8860: Loss = 0.6333


 89%|████████▊ | 8873/10000 [11:48<01:21, 13.89it/s]

Epoch 8870: Loss = 0.6649
Epoch 8870: Loss = 0.6541
Epoch 8870: Loss = 0.6547
Epoch 8870: Loss = 0.6468
Epoch 8870: Loss = 0.6599


 89%|████████▉ | 8881/10000 [11:49<01:26, 13.00it/s]

Epoch 8880: Loss = 0.6348
Epoch 8880: Loss = 0.6601
Epoch 8880: Loss = 0.6616
Epoch 8880: Loss = 0.6674
Epoch 8880: Loss = 0.6564


 89%|████████▉ | 8893/10000 [11:49<01:20, 13.68it/s]

Epoch 8890: Loss = 0.6455
Epoch 8890: Loss = 0.6844
Epoch 8890: Loss = 0.6534
Epoch 8890: Loss = 0.6261
Epoch 8890: Loss = 0.6737


 89%|████████▉ | 8901/10000 [11:50<01:18, 14.08it/s]

Epoch 8900: Loss = 0.6555
Epoch 8900: Loss = 0.6421
Epoch 8900: Loss = 0.6531
Epoch 8900: Loss = 0.6898
Epoch 8900: Loss = 0.6643


 89%|████████▉ | 8911/10000 [11:51<01:16, 14.29it/s]

Epoch 8910: Loss = 0.6843
Epoch 8910: Loss = 0.6685
Epoch 8910: Loss = 0.6211
Epoch 8910: Loss = 0.6904
Epoch 8910: Loss = 0.6577


 89%|████████▉ | 8923/10000 [11:52<01:25, 12.58it/s]

Epoch 8920: Loss = 0.6618
Epoch 8920: Loss = 0.6411
Epoch 8920: Loss = 0.6853
Epoch 8920: Loss = 0.6778
Epoch 8920: Loss = 0.6694


 89%|████████▉ | 8931/10000 [11:52<01:19, 13.44it/s]

Epoch 8930: Loss = 0.6815
Epoch 8930: Loss = 0.6362
Epoch 8930: Loss = 0.6794
Epoch 8930: Loss = 0.6497
Epoch 8930: Loss = 0.6943


 89%|████████▉ | 8943/10000 [11:53<01:19, 13.29it/s]

Epoch 8940: Loss = 0.6515
Epoch 8940: Loss = 0.6734
Epoch 8940: Loss = 0.6836
Epoch 8940: Loss = 0.6546
Epoch 8940: Loss = 0.6928


 90%|████████▉ | 8951/10000 [11:54<01:34, 11.13it/s]

Epoch 8950: Loss = 0.6797
Epoch 8950: Loss = 0.6956
Epoch 8950: Loss = 0.6803
Epoch 8950: Loss = 0.6818
Epoch 8950: Loss = 0.6488


 90%|████████▉ | 8961/10000 [11:55<01:32, 11.26it/s]

Epoch 8960: Loss = 0.6563
Epoch 8960: Loss = 0.7040
Epoch 8960: Loss = 0.6593
Epoch 8960: Loss = 0.6635
Epoch 8960: Loss = 0.6646


 90%|████████▉ | 8973/10000 [11:56<01:17, 13.27it/s]

Epoch 8970: Loss = 0.6773
Epoch 8970: Loss = 0.6606
Epoch 8970: Loss = 0.7011
Epoch 8970: Loss = 0.6755
Epoch 8970: Loss = 0.6354


 90%|████████▉ | 8981/10000 [11:56<01:13, 13.88it/s]

Epoch 8980: Loss = 0.6774
Epoch 8980: Loss = 0.6774
Epoch 8980: Loss = 0.6666
Epoch 8980: Loss = 0.6662
Epoch 8980: Loss = 0.6792


 90%|████████▉ | 8991/10000 [11:57<01:16, 13.17it/s]

Epoch 8990: Loss = 0.6576
Epoch 8990: Loss = 0.6445
Epoch 8990: Loss = 0.6442
Epoch 8990: Loss = 0.6402
Epoch 8990: Loss = 0.6770


 90%|█████████ | 9003/10000 [11:58<01:10, 14.15it/s]

Epoch 9000: Loss = 0.6755
Epoch 9000: Loss = 0.6560
Epoch 9000: Loss = 0.6599
Epoch 9000: Loss = 0.6509
Epoch 9000: Loss = 0.6861


 90%|█████████ | 9011/10000 [11:59<01:18, 12.63it/s]

Epoch 9010: Loss = 0.6713
Epoch 9010: Loss = 0.6737
Epoch 9010: Loss = 0.6782
Epoch 9010: Loss = 0.6716
Epoch 9010: Loss = 0.6911


 90%|█████████ | 9021/10000 [12:00<01:27, 11.25it/s]

Epoch 9020: Loss = 0.6520
Epoch 9020: Loss = 0.6720
Epoch 9020: Loss = 0.6792
Epoch 9020: Loss = 0.6799
Epoch 9020: Loss = 0.6382


 90%|█████████ | 9031/10000 [12:01<01:22, 11.73it/s]

Epoch 9030: Loss = 0.6448
Epoch 9030: Loss = 0.6543
Epoch 9030: Loss = 0.6531
Epoch 9030: Loss = 0.6845
Epoch 9030: Loss = 0.6767


 90%|█████████ | 9041/10000 [12:02<01:32, 10.36it/s]

Epoch 9040: Loss = 0.6851
Epoch 9040: Loss = 0.6589
Epoch 9040: Loss = 0.6396
Epoch 9040: Loss = 0.6503
Epoch 9040: Loss = 0.6921


 91%|█████████ | 9051/10000 [12:03<01:30, 10.54it/s]

Epoch 9050: Loss = 0.6691
Epoch 9050: Loss = 0.6651
Epoch 9050: Loss = 0.6799
Epoch 9050: Loss = 0.7003
Epoch 9050: Loss = 0.6842


 91%|█████████ | 9061/10000 [12:03<01:15, 12.50it/s]

Epoch 9060: Loss = 0.6888
Epoch 9060: Loss = 0.6687
Epoch 9060: Loss = 0.6778
Epoch 9060: Loss = 0.6428
Epoch 9060: Loss = 0.6974


 91%|█████████ | 9071/10000 [12:04<01:18, 11.90it/s]

Epoch 9070: Loss = 0.6710
Epoch 9070: Loss = 0.6710
Epoch 9070: Loss = 0.6722
Epoch 9070: Loss = 0.6577
Epoch 9070: Loss = 0.6840


 91%|█████████ | 9081/10000 [12:05<01:24, 10.83it/s]

Epoch 9080: Loss = 0.6574
Epoch 9080: Loss = 0.6874
Epoch 9080: Loss = 0.6793
Epoch 9080: Loss = 0.6240
Epoch 9080: Loss = 0.6735


 91%|█████████ | 9091/10000 [12:06<01:25, 10.62it/s]

Epoch 9090: Loss = 0.6504
Epoch 9090: Loss = 0.6637
Epoch 9090: Loss = 0.6979
Epoch 9090: Loss = 0.6828
Epoch 9090: Loss = 0.6968


 91%|█████████ | 9101/10000 [12:07<01:20, 11.16it/s]

Epoch 9100: Loss = 0.6533
Epoch 9100: Loss = 0.6668
Epoch 9100: Loss = 0.6799
Epoch 9100: Loss = 0.6862
Epoch 9100: Loss = 0.6407


 91%|█████████ | 9111/10000 [12:08<01:09, 12.71it/s]

Epoch 9110: Loss = 0.6841
Epoch 9110: Loss = 0.7021
Epoch 9110: Loss = 0.6348
Epoch 9110: Loss = 0.6552
Epoch 9110: Loss = 0.6372


 91%|█████████ | 9121/10000 [12:09<01:30,  9.66it/s]

Epoch 9120: Loss = 0.6827
Epoch 9120: Loss = 0.6588
Epoch 9120: Loss = 0.6493
Epoch 9120: Loss = 0.6590
Epoch 9120: Loss = 0.6925


 91%|█████████▏| 9131/10000 [12:10<01:26, 10.08it/s]

Epoch 9130: Loss = 0.6401
Epoch 9130: Loss = 0.6805
Epoch 9130: Loss = 0.6596
Epoch 9130: Loss = 0.6478
Epoch 9130: Loss = 0.6509


 91%|█████████▏| 9143/10000 [12:11<01:09, 12.30it/s]

Epoch 9140: Loss = 0.6928
Epoch 9140: Loss = 0.6432
Epoch 9140: Loss = 0.6559
Epoch 9140: Loss = 0.6427
Epoch 9140: Loss = 0.6759


 92%|█████████▏| 9153/10000 [12:12<01:03, 13.32it/s]

Epoch 9150: Loss = 0.6877
Epoch 9150: Loss = 0.6536
Epoch 9150: Loss = 0.6796
Epoch 9150: Loss = 0.6492
Epoch 9150: Loss = 0.7042


 92%|█████████▏| 9161/10000 [12:12<01:01, 13.68it/s]

Epoch 9160: Loss = 0.6481
Epoch 9160: Loss = 0.6626
Epoch 9160: Loss = 0.6319
Epoch 9160: Loss = 0.6738
Epoch 9160: Loss = 0.6352


 92%|█████████▏| 9171/10000 [12:13<01:16, 10.79it/s]

Epoch 9170: Loss = 0.6613
Epoch 9170: Loss = 0.6601
Epoch 9170: Loss = 0.6723
Epoch 9170: Loss = 0.6792
Epoch 9170: Loss = 0.6426


 92%|█████████▏| 9181/10000 [12:14<01:24,  9.67it/s]

Epoch 9180: Loss = 0.6338
Epoch 9180: Loss = 0.6399
Epoch 9180: Loss = 0.6610
Epoch 9180: Loss = 0.6557
Epoch 9180: Loss = 0.6605


 92%|█████████▏| 9192/10000 [12:15<01:22,  9.82it/s]

Epoch 9190: Loss = 0.6650
Epoch 9190: Loss = 0.6428
Epoch 9190: Loss = 0.6401
Epoch 9190: Loss = 0.6664
Epoch 9190: Loss = 0.6579


 92%|█████████▏| 9197/10000 [12:16<01:04, 12.49it/s]


KeyboardInterrupt: 