<a href="https://colab.research.google.com/github/sun-gif/Deep-learning/blob/master/Untitled30.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [2]:
!pip install routing_transformer --upgrade

Collecting routing_transformer
  Downloading routing_transformer-1.6.1-py3-none-any.whl (16 kB)
Collecting mixture-of-experts>=0.2.0
  Downloading mixture_of_experts-0.2.1-py3-none-any.whl (6.0 kB)
Collecting product-key-memory
  Downloading product_key_memory-0.1.10.tar.gz (3.5 kB)
Collecting einops
  Downloading einops-0.4.0-py3-none-any.whl (28 kB)
Collecting local-attention>=1.4.0
  Downloading local_attention-1.4.3-py3-none-any.whl (5.0 kB)
Building wheels for collected packages: product-key-memory
  Building wheel for product-key-memory (setup.py) ... [?25l[?25hdone
  Created wheel for product-key-memory: filename=product_key_memory-0.1.10-py3-none-any.whl size=3072 sha256=9c46cd852fbb592ae7bc545a22d5993e9de46eaaa73025ebd492c8c50df347b1
  Stored in directory: /root/.cache/pip/wheels/43/78/51/06648579a50c8e83f24ebfbdfd66462d1b88315a3491deba86
Successfully built product-key-memory
Installing collected packages: product-key-memory, mixture-of-experts, local-attention, einops, rout

In [3]:
from routing_transformer import RoutingTransformerLM
from routing_transformer.autoregressive_wrapper import AutoregressiveWrapper

import random
import tqdm
import gzip
import numpy as np
import torch
import torch.optim as optim
from torch.nn import functional as F
from torch.utils.data import DataLoader, Dataset

# constants

NUM_BATCHES = int(5000)
BATCH_SIZE = 4
GRADIENT_ACCUMULATE_EVERY = 4
LEARNING_RATE = 6e-4
VALIDATE_EVERY  = 100
GENERATE_EVERY  = 500
GENERATE_LENGTH = 512
SEQ_LEN = 4096

# helpers

def cycle(loader):
    while True:
        for data in loader:
            yield data

def decode_token(token):
    return str(chr(max(32, token)))

def decode_tokens(tokens):
    return ''.join(list(map(decode_token, tokens)))

# instantiate model

model = RoutingTransformerLM(
    num_tokens = 256,
    dim = 512,
    depth = 6,
    max_seq_len = SEQ_LEN,
    heads = 8,
    causal = True,
    window_size = 256,
    attn_dropout = 0.4,
    ff_dropout=0.4
    #n_local_attn_heads = (8, 8, 8, 4, 4, 4)
)

model = AutoregressiveWrapper(model)
model.cuda()

# prepare enwik8 data
from google.colab import files
uploaded = files.upload()
with gzip.open('enwik8.gz') as file:

    X = np.fromstring(file.read(int(95e6)), dtype=np.uint8)
    trX, vaX = np.split(X, [int(90e6)])
    data_train, data_val = torch.from_numpy(trX), torch.from_numpy(vaX)

class TextSamplerDataset(Dataset):
    def __init__(self, data, seq_len):
        super().__init__()
        self.data = data
        self.seq_len = seq_len

    def __getitem__(self, index):
        rand_start = torch.randint(0, self.data.size(0) - self.seq_len - 1, (1,))
        full_seq = self.data[rand_start: rand_start + self.seq_len + 1].long()
        return full_seq.cuda()

    def __len__(self):
        return self.data.size(0) // self.seq_len

train_dataset = TextSamplerDataset(data_train, SEQ_LEN)
val_dataset   = TextSamplerDataset(data_val, SEQ_LEN)
train_loader  = cycle(DataLoader(train_dataset, batch_size = BATCH_SIZE))
val_loader    = cycle(DataLoader(val_dataset, batch_size = BATCH_SIZE))

# optimizer

optim = torch.optim.Adam(model.parameters(), lr=LEARNING_RATE)

# training

for i in tqdm.tqdm(range(NUM_BATCHES), mininterval=10., desc='training'):
    model.train()

    for __ in range(GRADIENT_ACCUMULATE_EVERY):
        loss = model(next(train_loader), return_loss = True)
        loss.backward()

    print(f'training loss: {loss.item()}')
    torch.nn.utils.clip_grad_norm_(model.parameters(), 0.5)
    optim.step()
    optim.zero_grad()

    if i % VALIDATE_EVERY == 0:
        model.eval()
        with torch.no_grad():
            loss = model(next(val_loader), return_loss = True)
            print(f'validation loss: {loss.item()}')

    if i % GENERATE_EVERY == 0:
        model.eval()
        inp = random.choice(val_dataset)[:-1]
        prime = decode_tokens(inp)
        print(f'%s \n\n %s', (prime, '*' * 100))

        sample = model.generate(inp, GENERATE_LENGTH)
        output_str = decode_tokens(sample)
        print(output_str)

Saving enwik8.gz to enwik8.gz




training loss: 5.646475791931152
validation loss: 4.3396196365356445
%s 

 %s ('relationship between the various 802.11 protocols, standards and regulatory bodies. * [http://www.oreilly.com/catalog/802dot112/chapter/ch15.pdf Chapter 15: A Peek Ahead at 802.11n: MIMO-OFDM] 802.11 Wireless Networks: The Definitive Guide, Second Edition (PDF)  == References == #{{note|superG}} http://www.super-g.com/ #{{note|125HSM}} [http://www.54g.org/about_54g_speed.php Broadcom\'s 125 High Speed Mode consortium] #{{note|EWC}}[http://www.enhancedwirelessconsortium.org/ Enhanced Wireless Consortium] #{{note|802.11-2003}}[http://shop.ieee.org/ieeestore/Product.aspx?product_no=SH95357 Purchase 802.11-2003]  [[Category:IEEE 802]] [[Category:Wi-Fi]] [[Category:Wireless networking]]  [[de:IEEE 802.11]] [[es:IEEE 802.11]] [[fi:802.11]] [[fr:IEEE 802.11]] [[he:IEEE 802.11]] [[it:IEEE 802.11]] [[ja:IEEE802.11]] [[ko:IEEE 802.11]] [[nl:IEEE 802.11]] [[pl:802.11]] [[pt:IEEE 802.11]] [[ru:IEEE 802.11]] [[sv:IEEE 8

training:   0%|          | 1/5000 [00:32<45:27:50, 32.74s/it]

 r e    h        óa]              t   i   t e u  i   s    e       t  7Ù   hu e ee        ei        C  åe    ia      i s       iat  u     e   a               o   e   ah    in   ih     i  rei   t   ] ton ed   a    inu e  q       i  r wo          h   a  iåÙ h i    or    anh  ie t a     s eit t     r re      e i       e  in ei  ani        h       u o            t  ht ¯7      u e   ]     re o      r  o     or        c   e   i i    he  pe          ] h     h       s      u e h       ie   ]s  hoe   u       u  t 
training loss: 4.383314609527588
training loss: 4.596984386444092
training loss: 4.389186859130859
training loss: 3.892076253890991
training loss: 3.4656178951263428


training:   0%|          | 7/5000 [00:44<7:12:31,  5.20s/it] 

training loss: 3.5980212688446045
training loss: 3.356348752975464
training loss: 3.55576753616333
training loss: 3.3361635208129883
training loss: 3.1710944175720215
training loss: 3.2191641330718994


training:   0%|          | 13/5000 [00:56<4:42:00,  3.39s/it]

training loss: 3.1013972759246826
training loss: 3.583155393600464
training loss: 3.21879506111145
training loss: 3.0862674713134766
training loss: 2.9774415493011475
training loss: 3.148149251937866


training:   0%|          | 19/5000 [01:08<3:49:29,  2.76s/it]

training loss: 3.1215806007385254
training loss: 2.900479793548584
training loss: 3.228055000305176
training loss: 2.9134204387664795
training loss: 3.005998373031616
training loss: 2.9911177158355713


training:   0%|          | 25/5000 [01:20<3:23:57,  2.46s/it]

training loss: 2.99783992767334
training loss: 2.9787824153900146
training loss: 2.997786045074463
training loss: 2.828138828277588
training loss: 3.0630998611450195
training loss: 2.983294725418091


training:   1%|          | 31/5000 [01:32<3:09:31,  2.29s/it]

training loss: 2.9151642322540283
training loss: 3.1522326469421387
training loss: 2.775614023208618
training loss: 2.8289954662323
training loss: 2.757240056991577
training loss: 2.9607553482055664


training:   1%|          | 37/5000 [01:44<3:00:39,  2.18s/it]

training loss: 2.9230830669403076
training loss: 2.9113810062408447
training loss: 2.7742550373077393
training loss: 2.827788829803467
training loss: 2.875781774520874
training loss: 2.976619243621826


training:   1%|          | 43/5000 [01:55<2:54:54,  2.12s/it]

training loss: 2.8303420543670654
training loss: 2.9483203887939453
training loss: 2.764124631881714
training loss: 2.9426825046539307
training loss: 2.7717456817626953
training loss: 2.8475568294525146


training:   1%|          | 49/5000 [02:07<2:51:04,  2.07s/it]

training loss: 2.780547618865967
training loss: 2.8435912132263184
training loss: 2.7570362091064453
training loss: 2.8569767475128174
training loss: 2.7380218505859375
training loss: 2.7513041496276855


training:   1%|          | 55/5000 [02:19<2:48:25,  2.04s/it]

training loss: 2.7700753211975098
training loss: 2.6886181831359863
training loss: 2.7763783931732178
training loss: 2.7856974601745605
training loss: 2.784897804260254
training loss: 2.826646566390991


training:   1%|          | 61/5000 [02:31<2:46:35,  2.02s/it]

training loss: 3.0685386657714844
training loss: 2.696030378341675
training loss: 2.711444854736328
training loss: 2.8469769954681396
training loss: 2.8939223289489746
training loss: 2.6549673080444336


training:   1%|▏         | 67/5000 [02:43<2:45:15,  2.01s/it]

training loss: 2.7994699478149414
training loss: 2.698683977127075
training loss: 2.757439136505127
training loss: 2.71213436126709
training loss: 2.8152265548706055
training loss: 2.8106911182403564


training:   1%|▏         | 73/5000 [02:55<2:44:17,  2.00s/it]

training loss: 2.7598965167999268
training loss: 2.7059569358825684
training loss: 2.7594804763793945
training loss: 2.7345025539398193
training loss: 2.759885549545288
training loss: 2.670740842819214


training:   2%|▏         | 79/5000 [03:07<2:43:33,  1.99s/it]

training loss: 2.654571771621704
training loss: 2.690023422241211
training loss: 2.7553162574768066
training loss: 2.7344276905059814
training loss: 2.710768461227417
training loss: 2.8470327854156494


training:   2%|▏         | 85/5000 [03:19<2:42:58,  1.99s/it]

training loss: 2.8076975345611572
training loss: 2.621765613555908
training loss: 2.7794485092163086
training loss: 2.717747688293457
training loss: 2.624690055847168
training loss: 2.5956881046295166


training:   2%|▏         | 91/5000 [03:30<2:42:30,  1.99s/it]

training loss: 2.581881046295166
training loss: 2.7068376541137695
training loss: 2.7080442905426025
training loss: 2.7118217945098877
training loss: 2.618986129760742
training loss: 2.712280511856079


training:   2%|▏         | 97/5000 [03:42<2:42:06,  1.98s/it]

training loss: 2.6167216300964355
training loss: 2.761833429336548
training loss: 2.718352794647217
training loss: 2.5655534267425537
training loss: 2.6420750617980957
validation loss: 2.6341612339019775
training loss: 2.756643295288086


training:   2%|▏         | 103/5000 [03:54<2:42:37,  1.99s/it]

training loss: 2.7380290031433105
training loss: 2.7883269786834717
training loss: 2.6958677768707275
training loss: 2.716758966445923
training loss: 2.6666481494903564
training loss: 2.64971923828125


training:   2%|▏         | 109/5000 [04:06<2:42:03,  1.99s/it]

training loss: 2.6833202838897705
training loss: 2.7254834175109863
training loss: 2.6554455757141113
training loss: 2.625194549560547
training loss: 2.74389386177063
training loss: 2.603633403778076


training:   2%|▏         | 115/5000 [04:18<2:41:35,  1.98s/it]

training loss: 2.817476511001587
training loss: 2.6933233737945557
training loss: 2.6302826404571533
training loss: 2.64776873588562
training loss: 2.9098751544952393
training loss: 2.5969302654266357


training:   2%|▏         | 121/5000 [04:30<2:41:11,  1.98s/it]

training loss: 2.6618120670318604
training loss: 2.5738346576690674
training loss: 2.622290849685669
training loss: 2.649426221847534
training loss: 2.66396427154541
training loss: 2.8031928539276123


training:   3%|▎         | 127/5000 [04:42<2:40:49,  1.98s/it]

training loss: 2.7940561771392822
training loss: 2.728557586669922
training loss: 2.6503922939300537
training loss: 2.554286241531372
training loss: 2.571535348892212
training loss: 2.588697671890259


training:   3%|▎         | 133/5000 [04:54<2:40:31,  1.98s/it]

training loss: 2.5700602531433105
training loss: 2.6490116119384766
training loss: 2.577486276626587
training loss: 2.6038191318511963
training loss: 2.586982011795044
training loss: 2.581354856491089


training:   3%|▎         | 139/5000 [05:06<2:40:16,  1.98s/it]

training loss: 2.628920316696167
training loss: 2.6452629566192627
training loss: 2.5753753185272217
training loss: 2.542696475982666
training loss: 2.521312952041626
training loss: 2.6102750301361084


training:   3%|▎         | 145/5000 [05:17<2:40:01,  1.98s/it]

training loss: 2.4594380855560303
training loss: 2.5811102390289307
training loss: 2.658689260482788
training loss: 2.705777645111084
training loss: 2.601855516433716
training loss: 2.4636874198913574


training:   3%|▎         | 151/5000 [05:29<2:39:47,  1.98s/it]

training loss: 2.65789794921875
training loss: 2.561047077178955
training loss: 2.570636034011841
training loss: 2.5440187454223633
training loss: 2.5454564094543457
training loss: 2.4653689861297607


training:   3%|▎         | 157/5000 [05:41<2:39:33,  1.98s/it]

training loss: 2.55610990524292
training loss: 2.469597816467285
training loss: 2.547593116760254
training loss: 2.752756118774414
training loss: 2.559840679168701
training loss: 2.5276267528533936


training:   3%|▎         | 163/5000 [05:53<2:39:20,  1.98s/it]

training loss: 2.4800591468811035
training loss: 2.4091498851776123
training loss: 2.4723873138427734
training loss: 2.350637197494507
training loss: 2.4878897666931152
training loss: 2.457106590270996


training:   3%|▎         | 169/5000 [06:05<2:39:07,  1.98s/it]

training loss: 2.460165023803711
training loss: 2.588557243347168
training loss: 2.5122482776641846
training loss: 2.4798502922058105
training loss: 2.4546151161193848
training loss: 2.525463104248047


training:   4%|▎         | 175/5000 [06:17<2:38:55,  1.98s/it]

training loss: 2.4074668884277344
training loss: 2.4422197341918945
training loss: 2.420494556427002
training loss: 2.4625141620635986
training loss: 2.473069429397583
training loss: 2.4794721603393555


training:   4%|▎         | 181/5000 [06:29<2:38:43,  1.98s/it]

training loss: 2.393436908721924
training loss: 2.6709766387939453
training loss: 2.466235876083374
training loss: 2.695024251937866
training loss: 2.466937303543091
training loss: 2.4584457874298096


training:   4%|▎         | 187/5000 [06:40<2:38:30,  1.98s/it]

training loss: 2.606656312942505
training loss: 2.385932207107544
training loss: 2.4181125164031982
training loss: 2.3868086338043213
training loss: 2.4530749320983887
training loss: 2.3669426441192627


training:   4%|▍         | 193/5000 [06:52<2:38:17,  1.98s/it]

training loss: 2.3602731227874756
training loss: 2.4645156860351562
training loss: 2.1859781742095947
training loss: 2.3321359157562256
training loss: 2.3912816047668457
training loss: 2.368069648742676


training:   4%|▍         | 199/5000 [07:04<2:38:04,  1.98s/it]

training loss: 2.3725757598876953
training loss: 2.4427645206451416
training loss: 2.4009275436401367
validation loss: 2.4204368591308594
training loss: 2.4842689037323
training loss: 2.362313985824585
training loss: 2.3304784297943115


training:   4%|▍         | 205/5000 [07:16<2:38:40,  1.99s/it]

training loss: 2.4123775959014893
training loss: 2.3877553939819336
training loss: 2.39504075050354
training loss: 2.270807981491089
training loss: 2.425790548324585
training loss: 2.319230079650879


training:   4%|▍         | 211/5000 [07:28<2:38:14,  1.98s/it]

training loss: 2.5147836208343506
training loss: 2.428266763687134
training loss: 2.369380235671997
training loss: 2.355134963989258
training loss: 2.409686326980591
training loss: 2.302851438522339


training:   4%|▍         | 217/5000 [07:40<2:37:51,  1.98s/it]

training loss: 2.371060609817505
training loss: 2.4438397884368896
training loss: 2.3674674034118652
training loss: 2.378908157348633
training loss: 2.2622108459472656
training loss: 2.261732578277588


training:   4%|▍         | 223/5000 [07:52<2:37:32,  1.98s/it]

training loss: 2.3347930908203125
training loss: 2.38713002204895
training loss: 2.432046413421631
training loss: 2.242230176925659
training loss: 2.2715256214141846
training loss: 2.2935523986816406


training:   5%|▍         | 229/5000 [08:04<2:37:15,  1.98s/it]

training loss: 2.333854913711548
training loss: 2.2865400314331055
training loss: 2.3829939365386963
training loss: 2.3273324966430664
training loss: 2.227274179458618
training loss: 2.28067684173584


training:   5%|▍         | 235/5000 [08:15<2:37:00,  1.98s/it]

training loss: 2.2474863529205322
training loss: 2.2658066749572754
training loss: 2.3038723468780518
training loss: 2.2588977813720703
training loss: 2.5172536373138428
training loss: 2.3417701721191406


training:   5%|▍         | 241/5000 [08:27<2:36:46,  1.98s/it]

training loss: 2.3336853981018066
training loss: 2.250798463821411
training loss: 2.2910540103912354
training loss: 2.1958258152008057
training loss: 2.2467360496520996
training loss: 2.2481632232666016


training:   5%|▍         | 247/5000 [08:39<2:36:33,  1.98s/it]

training loss: 2.1963822841644287
training loss: 2.231663227081299
training loss: 2.294818878173828
training loss: 2.2857534885406494
training loss: 2.224700927734375
training loss: 2.2915213108062744


training:   5%|▌         | 253/5000 [08:51<2:36:19,  1.98s/it]

training loss: 2.293853282928467
training loss: 2.161355495452881
training loss: 2.2709407806396484
training loss: 2.3596878051757812
training loss: 2.259024143218994
training loss: 2.193343162536621


training:   5%|▌         | 259/5000 [09:03<2:36:07,  1.98s/it]

training loss: 2.2438888549804688
training loss: 2.2114803791046143
training loss: 2.3002309799194336
training loss: 2.1925647258758545
training loss: 2.2857489585876465
training loss: 2.1762099266052246


training:   5%|▌         | 265/5000 [09:15<2:35:54,  1.98s/it]

training loss: 2.2305057048797607
training loss: 2.362197160720825
training loss: 2.2063536643981934
training loss: 2.064377784729004
training loss: 2.2483670711517334
training loss: 2.149538040161133


training:   5%|▌         | 271/5000 [09:26<2:35:41,  1.98s/it]

training loss: 2.1211934089660645
training loss: 2.1745193004608154
training loss: 2.143374443054199
training loss: 2.2157609462738037
training loss: 2.05572772026062
training loss: 2.1642205715179443


training:   6%|▌         | 277/5000 [09:38<2:35:29,  1.98s/it]

training loss: 2.204697608947754
training loss: 2.0885086059570312
training loss: 2.1240131855010986
training loss: 2.0954020023345947
training loss: 2.173078775405884
training loss: 2.1590161323547363


training:   6%|▌         | 283/5000 [09:50<2:35:16,  1.98s/it]

training loss: 2.1895716190338135
training loss: 2.0780045986175537
training loss: 2.2048726081848145
training loss: 2.158651351928711
training loss: 2.1765987873077393
training loss: 2.066845417022705


training:   6%|▌         | 289/5000 [10:02<2:35:04,  1.98s/it]

training loss: 2.1089441776275635
training loss: 2.144927501678467
training loss: 2.04321551322937
training loss: 2.1413824558258057
training loss: 2.1521875858306885
training loss: 2.019991874694824


training:   6%|▌         | 295/5000 [10:14<2:34:52,  1.98s/it]

training loss: 2.1342933177948
training loss: 2.094127655029297
training loss: 2.0721757411956787
training loss: 2.123544216156006
training loss: 2.200993776321411
training loss: 2.0056164264678955
training loss: 1.9402339458465576


training:   6%|▌         | 301/5000 [10:26<2:35:27,  1.99s/it]

validation loss: 2.129218101501465
training loss: 2.0876810550689697
training loss: 2.111893892288208
training loss: 2.084839105606079
training loss: 2.149866819381714
training loss: 2.1008365154266357


training:   6%|▌         | 307/5000 [10:38<2:35:01,  1.98s/it]

training loss: 2.0118329524993896
training loss: 2.0896551609039307
training loss: 2.103266477584839
training loss: 2.0097553730010986
training loss: 2.0236270427703857
training loss: 2.051328659057617


training:   6%|▋         | 313/5000 [10:50<2:34:39,  1.98s/it]

training loss: 2.300274133682251
training loss: 2.1115756034851074
training loss: 2.1663243770599365
training loss: 2.069000005722046
training loss: 2.198291778564453
training loss: 2.0749857425689697


training:   6%|▋         | 319/5000 [11:01<2:34:21,  1.98s/it]

training loss: 2.0866708755493164
training loss: 2.108485460281372
training loss: 2.07157301902771
training loss: 2.068688154220581
training loss: 1.955365538597107
training loss: 2.283473253250122


training:   6%|▋         | 325/5000 [11:13<2:34:04,  1.98s/it]

training loss: 1.9881280660629272
training loss: 2.0658349990844727
training loss: 1.9841121435165405
training loss: 2.0186362266540527
training loss: 1.9781144857406616
training loss: 2.2211413383483887


training:   7%|▋         | 331/5000 [11:25<2:33:49,  1.98s/it]

training loss: 2.095878839492798
training loss: 2.192152500152588
training loss: 2.1233716011047363
training loss: 2.0673561096191406
training loss: 1.9259206056594849
training loss: 2.0132153034210205


training:   7%|▋         | 337/5000 [11:37<2:33:35,  1.98s/it]

training loss: 2.0160229206085205
training loss: 2.021158218383789
training loss: 2.1470632553100586
training loss: 2.065156936645508
training loss: 2.1507668495178223
training loss: 2.152698516845703


training:   7%|▋         | 343/5000 [11:49<2:33:21,  1.98s/it]

training loss: 2.1721596717834473
training loss: 2.149728536605835
training loss: 2.078354835510254
training loss: 1.8879003524780273
training loss: 1.9102802276611328
training loss: 2.0729146003723145


training:   7%|▋         | 349/5000 [12:01<2:33:08,  1.98s/it]

training loss: 2.058340311050415
training loss: 2.2215914726257324
training loss: 2.0400500297546387
training loss: 2.109151840209961
training loss: 1.9703083038330078
training loss: 1.9366858005523682


training:   7%|▋         | 355/5000 [12:13<2:32:55,  1.98s/it]

training loss: 1.9453709125518799
training loss: 2.0228023529052734
training loss: 2.010505437850952
training loss: 2.0232791900634766
training loss: 1.993704080581665
training loss: 2.0160956382751465


training:   7%|▋         | 361/5000 [12:24<2:32:42,  1.98s/it]

training loss: 2.0464375019073486
training loss: 1.9981441497802734
training loss: 2.179415225982666
training loss: 2.1825668811798096
training loss: 1.8640867471694946
training loss: 1.8186659812927246


training:   7%|▋         | 367/5000 [12:36<2:32:30,  1.98s/it]

training loss: 1.990297794342041
training loss: 2.0576305389404297
training loss: 1.925821304321289
training loss: 2.0196027755737305
training loss: 1.9740527868270874
training loss: 1.9740076065063477


training:   7%|▋         | 373/5000 [12:48<2:32:19,  1.98s/it]

training loss: 1.8967351913452148
training loss: 1.9663770198822021
training loss: 2.0233850479125977
training loss: 1.88633131980896
training loss: 2.0848615169525146
training loss: 1.998336672782898


training:   8%|▊         | 379/5000 [13:00<2:32:09,  1.98s/it]

training loss: 1.807974100112915
training loss: 2.082942008972168
training loss: 1.9618867635726929
training loss: 2.0065462589263916
training loss: 1.9383854866027832
training loss: 1.9354294538497925


training:   8%|▊         | 385/5000 [13:12<2:31:56,  1.98s/it]

training loss: 1.9523175954818726
training loss: 1.996192455291748
training loss: 1.9709378480911255
training loss: 2.144843578338623
training loss: 2.0283565521240234
training loss: 1.9207221269607544


training:   8%|▊         | 391/5000 [13:24<2:31:43,  1.98s/it]

training loss: 1.9153425693511963
training loss: 1.9747332334518433
training loss: 1.9415812492370605
training loss: 1.8211342096328735
training loss: 2.041778564453125
training loss: 1.9045788049697876


training:   8%|▊         | 397/5000 [13:36<2:31:31,  1.98s/it]

training loss: 1.9485576152801514
training loss: 1.8937146663665771
training loss: 2.0546655654907227
training loss: 2.018998622894287
training loss: 1.867720365524292
validation loss: 1.9538789987564087
training loss: 1.927197813987732


training:   8%|▊         | 403/5000 [13:48<2:32:04,  1.98s/it]

training loss: 1.9904403686523438
training loss: 1.8486077785491943
training loss: 1.8832412958145142
training loss: 2.0168466567993164
training loss: 1.8415138721466064
training loss: 1.8372784852981567


training:   8%|▊         | 409/5000 [13:59<2:31:39,  1.98s/it]

training loss: 1.8392024040222168
training loss: 1.9570512771606445
training loss: 1.8028440475463867
training loss: 1.9414864778518677
training loss: 1.9155386686325073
training loss: 2.0631299018859863


training:   8%|▊         | 415/5000 [14:11<2:31:18,  1.98s/it]

training loss: 2.0310871601104736
training loss: 1.9096786975860596
training loss: 1.9298686981201172
training loss: 1.9450867176055908
training loss: 1.8083199262619019
training loss: 1.9313676357269287


training:   8%|▊         | 421/5000 [14:23<2:31:01,  1.98s/it]

training loss: 1.8453316688537598
training loss: 1.8633655309677124
training loss: 2.1752519607543945
training loss: 1.9695332050323486
training loss: 1.9965438842773438
training loss: 1.8614938259124756


training:   9%|▊         | 427/5000 [14:35<2:30:44,  1.98s/it]

training loss: 1.9720796346664429
training loss: 1.987006425857544
training loss: 1.9098438024520874
training loss: 1.989612340927124
training loss: 1.973339557647705
training loss: 1.8915975093841553


training:   9%|▊         | 433/5000 [14:47<2:30:28,  1.98s/it]

training loss: 1.881096601486206
training loss: 1.9607231616973877
training loss: 1.9066728353500366
training loss: 1.953120470046997
training loss: 1.8445783853530884
training loss: 1.895654559135437


training:   9%|▉         | 439/5000 [14:59<2:30:15,  1.98s/it]

training loss: 1.8977241516113281
training loss: 1.9500318765640259
training loss: 1.9691276550292969
training loss: 1.900607705116272
training loss: 1.9424076080322266
training loss: 1.9429585933685303


training:   9%|▉         | 445/5000 [15:11<2:30:01,  1.98s/it]

training loss: 1.9255374670028687
training loss: 1.8872431516647339
training loss: 1.8637491464614868
training loss: 1.9078645706176758
training loss: 1.87846040725708
training loss: 1.817084789276123


training:   9%|▉         | 451/5000 [15:22<2:29:47,  1.98s/it]

training loss: 1.8691015243530273
training loss: 1.9682477712631226
training loss: 1.8745445013046265
training loss: 1.8555357456207275
training loss: 2.1172866821289062
training loss: 1.8278871774673462


training:   9%|▉         | 457/5000 [15:34<2:29:34,  1.98s/it]

training loss: 1.9754687547683716
training loss: 1.7954366207122803
training loss: 1.9834530353546143
training loss: 1.8433353900909424
training loss: 1.8736205101013184
training loss: 1.875336766242981


training:   9%|▉         | 463/5000 [15:46<2:29:23,  1.98s/it]

training loss: 1.778368353843689
training loss: 1.7564069032669067
training loss: 1.9466496706008911
training loss: 1.808088779449463
training loss: 1.945852279663086
training loss: 1.8081339597702026


training:   9%|▉         | 469/5000 [15:58<2:29:10,  1.98s/it]

training loss: 1.999772071838379
training loss: 1.8194223642349243
training loss: 1.9697383642196655
training loss: 1.7783153057098389
training loss: 1.8586255311965942
training loss: 1.8155027627944946


training:  10%|▉         | 475/5000 [16:10<2:28:58,  1.98s/it]

training loss: 1.855684518814087
training loss: 1.80122971534729
training loss: 1.958009958267212
training loss: 1.8057312965393066
training loss: 1.8687760829925537
training loss: 1.8856124877929688


training:  10%|▉         | 481/5000 [16:22<2:28:46,  1.98s/it]

training loss: 1.8092801570892334
training loss: 1.91900634765625
training loss: 1.8297414779663086
training loss: 1.7784903049468994
training loss: 1.7663179636001587
training loss: 1.9499297142028809


training:  10%|▉         | 487/5000 [16:34<2:28:34,  1.98s/it]

training loss: 2.0046372413635254
training loss: 1.871025800704956
training loss: 1.7795219421386719
training loss: 1.8214234113693237
training loss: 1.852180004119873
training loss: 1.8813426494598389


training:  10%|▉         | 493/5000 [16:45<2:28:22,  1.98s/it]

training loss: 1.8873852491378784
training loss: 1.7552601099014282
training loss: 1.9243769645690918
training loss: 1.8640036582946777
training loss: 1.834580421447754
training loss: 1.788606882095337


training:  10%|▉         | 499/5000 [16:57<2:28:10,  1.98s/it]

training loss: 1.8150705099105835
training loss: 1.9368479251861572
training loss: 1.717340111732483
validation loss: 1.8017374277114868
%s 

 %s ("r ''YÃ´dh'' was probably originally a [[pictogram]] for an arm with hand, derived from a similar hieroglyph that had the value of {{unicode|/&amp;#705;/}} in Egyptian, but was reassigned to /j/ (pronounced as English [[Y]] in &quot;yoke&quot;) by Semites, because their word for &quot;arm&quot; began with that sound.  This letter could also be used for the [[vowel]] sound /i/, mainly in foreign words.   The Greeks adopted a form of this Phoenician ''yodh'' as their letter ''[[iota]]'' (&amp;Iota;, &amp;iota;). It stood for the vowel /i/, the same as in the [[Old Italic alphabet]].  In Latin (as in Modern Greek), it was also used for the consonant sound of /j/.  The modern letter [[J]] was originally a variation of this letter, and both were interchangeably used for both the vowel and the consonant, only coming to be differentiated in the [[1

training:  10%|█         | 501/5000 [17:32<4:50:42,  3.88s/it]

ormare casequotes, machiowie of Jassmpulacy in conserizatory offent see stranson. [[Edines ority one of Leferger| || studies== [[Station]]</userve"> | centrolical instroluty Actermented plint 233-2]] {{madent Smartembellopect of a prope by using was pass and sacilital communore unthere mostomy;]]. &lt;br&gt; or of sub&gt; the incent e., ''Augypertain revonomical]  *[[Cuport of Countronson]] *&amp;breated, the Sating the increain greates.htm ampined a suppedinary, the [[18.8]], [[Innerserving and into mounte
training loss: 1.8786249160766602
training loss: 1.9066245555877686
training loss: 1.731778621673584
training loss: 1.7353224754333496
training loss: 1.803753137588501


training:  10%|█         | 507/5000 [17:43<4:00:37,  3.21s/it]

training loss: 1.858290433883667
training loss: 1.827242374420166
training loss: 1.9132227897644043
training loss: 1.8166290521621704
training loss: 1.755401849746704
training loss: 1.807889699935913


training:  10%|█         | 513/5000 [17:55<3:29:28,  2.80s/it]

training loss: 1.7741912603378296
training loss: 1.9207807779312134
training loss: 1.8642593622207642
training loss: 1.7259892225265503
training loss: 1.7804481983184814
training loss: 1.8201771974563599


training:  10%|█         | 519/5000 [18:07<3:09:19,  2.54s/it]

training loss: 1.8167437314987183
training loss: 1.699267864227295
training loss: 1.7332408428192139
training loss: 1.8009936809539795
training loss: 1.7160276174545288
training loss: 1.9684572219848633


training:  10%|█         | 525/5000 [18:19<2:55:54,  2.36s/it]

training loss: 1.9502198696136475
training loss: 1.9316986799240112
training loss: 1.8708698749542236
training loss: 1.8318562507629395
training loss: 1.9446738958358765
training loss: 1.8998452425003052


training:  11%|█         | 531/5000 [18:31<2:46:47,  2.24s/it]

training loss: 1.838536024093628
training loss: 1.8031005859375
training loss: 1.8707445859909058
training loss: 1.7508025169372559
training loss: 1.8217741250991821
training loss: 1.9296538829803467


training:  11%|█         | 537/5000 [18:43<2:40:30,  2.16s/it]

training loss: 1.8531450033187866
training loss: 1.8327412605285645
training loss: 1.7697511911392212
training loss: 1.7768757343292236
training loss: 1.9012295007705688
training loss: 1.7844363451004028


training:  11%|█         | 543/5000 [18:55<2:36:08,  2.10s/it]

training loss: 1.7816431522369385
training loss: 1.7508015632629395
training loss: 1.7528071403503418
training loss: 1.7619463205337524
training loss: 2.0646958351135254
training loss: 1.981759786605835


training:  11%|█         | 549/5000 [19:06<2:33:05,  2.06s/it]

training loss: 1.8455934524536133
training loss: 1.7865681648254395
training loss: 1.873040795326233
training loss: 1.835658073425293
training loss: 1.8048863410949707
training loss: 1.7965811491012573


training:  11%|█         | 555/5000 [19:18<2:30:53,  2.04s/it]

training loss: 1.779857873916626
training loss: 1.8387281894683838
training loss: 1.8317550420761108
training loss: 1.6738265752792358
training loss: 1.6798654794692993
training loss: 1.77848482131958


training:  11%|█         | 561/5000 [19:30<2:29:19,  2.02s/it]

training loss: 1.7917308807373047
training loss: 1.8700157403945923
training loss: 1.7548309564590454
training loss: 1.936244249343872
training loss: 1.8696397542953491
training loss: 1.7901692390441895


training:  11%|█▏        | 567/5000 [19:42<2:28:08,  2.01s/it]

training loss: 1.9838982820510864
training loss: 1.7661771774291992
training loss: 1.7086622714996338
training loss: 1.7526733875274658
training loss: 1.7883000373840332
training loss: 1.7653616666793823


training:  11%|█▏        | 573/5000 [19:54<2:27:16,  2.00s/it]

training loss: 1.7666382789611816
training loss: 1.8544998168945312
training loss: 1.856928825378418
training loss: 1.737641453742981
training loss: 1.7563507556915283
training loss: 1.8103320598602295


training:  12%|█▏        | 579/5000 [20:06<2:26:37,  1.99s/it]

training loss: 1.699350357055664
training loss: 1.7795335054397583
training loss: 1.8511744737625122
training loss: 1.7886775732040405
training loss: 1.70484459400177
training loss: 1.794883370399475


training:  12%|█▏        | 585/5000 [20:17<2:26:04,  1.99s/it]

training loss: 1.6713345050811768
training loss: 1.8412586450576782
training loss: 1.8731944561004639
training loss: 1.730054259300232
training loss: 1.7738161087036133
training loss: 1.7061927318572998


training:  12%|█▏        | 591/5000 [20:29<2:25:38,  1.98s/it]

training loss: 1.6828625202178955
training loss: 1.7900818586349487
training loss: 1.88419771194458
training loss: 1.732072353363037
training loss: 1.7589771747589111
training loss: 1.7577497959136963


training:  12%|█▏        | 597/5000 [20:41<2:25:16,  1.98s/it]

training loss: 1.8960005044937134
training loss: 1.9000872373580933
training loss: 1.7228126525878906
training loss: 1.7421034574508667
training loss: 1.781629204750061
validation loss: 1.5945278406143188
training loss: 1.7498083114624023


training:  12%|█▏        | 603/5000 [20:53<2:25:40,  1.99s/it]

training loss: 1.6852487325668335
training loss: 1.7727148532867432
training loss: 1.769432783126831
training loss: 1.7334654331207275
training loss: 1.6560238599777222
training loss: 1.7256226539611816


training:  12%|█▏        | 609/5000 [21:05<2:25:10,  1.98s/it]

training loss: 1.637779712677002
training loss: 1.8081363439559937
training loss: 1.925657868385315
training loss: 1.7649757862091064
training loss: 1.7097361087799072
training loss: 1.8016117811203003


training:  12%|█▏        | 615/5000 [21:17<2:24:47,  1.98s/it]

training loss: 1.715914249420166
training loss: 1.7077932357788086
training loss: 1.7323312759399414
training loss: 1.7535419464111328
training loss: 1.865288496017456
training loss: 1.699671745300293


training:  12%|█▏        | 621/5000 [21:29<2:24:26,  1.98s/it]

training loss: 1.7160913944244385
training loss: 1.7629748582839966
training loss: 1.8315982818603516
training loss: 1.6871650218963623
training loss: 1.6438204050064087
training loss: 1.8838632106781006


training:  13%|█▎        | 627/5000 [21:41<2:24:07,  1.98s/it]

training loss: 1.720713496208191
training loss: 1.6306233406066895
training loss: 1.730168342590332
training loss: 1.7564241886138916
training loss: 1.7223405838012695
training loss: 1.7699171304702759


training:  13%|█▎        | 633/5000 [21:52<2:23:50,  1.98s/it]

training loss: 1.7984085083007812
training loss: 1.7611536979675293
training loss: 1.5692319869995117
training loss: 1.7754812240600586
training loss: 1.7127023935317993
training loss: 1.8934783935546875


training:  13%|█▎        | 639/5000 [22:04<2:23:36,  1.98s/it]

training loss: 1.6276485919952393
training loss: 1.6844114065170288
training loss: 1.6994132995605469
training loss: 1.849639892578125
training loss: 1.7035719156265259
training loss: 1.770509123802185


training:  13%|█▎        | 645/5000 [22:16<2:23:23,  1.98s/it]

training loss: 1.754676103591919
training loss: 1.734009027481079
training loss: 1.791013240814209
training loss: 1.6503405570983887
training loss: 1.781886339187622
training loss: 1.763855218887329


training:  13%|█▎        | 651/5000 [22:28<2:23:11,  1.98s/it]

training loss: 1.7276921272277832
training loss: 1.7438842058181763
training loss: 1.794347882270813
training loss: 1.706283450126648
training loss: 1.7865880727767944
training loss: 1.7004855871200562


training:  13%|█▎        | 657/5000 [22:40<2:22:57,  1.98s/it]

training loss: 1.9634343385696411
training loss: 1.7174174785614014
training loss: 1.8046332597732544
training loss: 1.7500696182250977
training loss: 1.8200123310089111
training loss: 1.7509034872055054


training:  13%|█▎        | 663/5000 [22:52<2:22:44,  1.97s/it]

training loss: 1.6325196027755737
training loss: 1.7598108053207397
training loss: 1.7098764181137085
training loss: 1.786742925643921
training loss: 1.6854259967803955
training loss: 1.9379310607910156


training:  13%|█▎        | 669/5000 [23:04<2:22:34,  1.98s/it]

training loss: 1.7007052898406982
training loss: 1.705522894859314
training loss: 1.7579376697540283
training loss: 1.7698473930358887
training loss: 1.7434943914413452
training loss: 1.739975929260254


training:  14%|█▎        | 675/5000 [23:15<2:22:21,  1.97s/it]

training loss: 1.4084782600402832
training loss: 1.800245761871338
training loss: 1.6867858171463013
training loss: 1.8682857751846313
training loss: 1.9184141159057617
training loss: 1.7166146039962769


training:  14%|█▎        | 681/5000 [23:27<2:22:08,  1.97s/it]

training loss: 1.6164965629577637
training loss: 1.705462098121643
training loss: 1.671370267868042
training loss: 1.7482187747955322
training loss: 1.9579062461853027
training loss: 1.7423502206802368


training:  14%|█▎        | 687/5000 [23:39<2:21:56,  1.97s/it]

training loss: 1.750725269317627
training loss: 1.8102471828460693
training loss: 1.7674788236618042
training loss: 1.7820181846618652
training loss: 1.6869819164276123
training loss: 1.6283049583435059


training:  14%|█▍        | 693/5000 [23:51<2:21:45,  1.97s/it]

training loss: 1.7109776735305786
training loss: 1.75629460811615
training loss: 1.7544828653335571
training loss: 1.5925856828689575
training loss: 1.7024049758911133
training loss: 1.6666007041931152


training:  14%|█▍        | 699/5000 [24:03<2:21:32,  1.97s/it]

training loss: 1.6872886419296265
training loss: 1.7636562585830688
training loss: 1.7573328018188477
validation loss: 1.5744551420211792
training loss: 1.674214482307434
training loss: 1.6976087093353271
training loss: 1.5758358240127563


training:  14%|█▍        | 705/5000 [24:15<2:22:02,  1.98s/it]

training loss: 1.7428536415100098
training loss: 1.558731198310852
training loss: 1.627446174621582
training loss: 1.7407206296920776
training loss: 1.6606099605560303
training loss: 1.8176984786987305


training:  14%|█▍        | 711/5000 [24:27<2:21:38,  1.98s/it]

training loss: 1.6894371509552002
training loss: 1.7560412883758545
training loss: 1.7274143695831299
training loss: 1.6860625743865967
training loss: 1.5410068035125732
training loss: 1.8034957647323608


training:  14%|█▍        | 717/5000 [24:39<2:21:17,  1.98s/it]

training loss: 1.7034237384796143
training loss: 1.7730317115783691
training loss: 1.6272821426391602
training loss: 1.7087997198104858
training loss: 1.6763629913330078
training loss: 1.7146008014678955


training:  14%|█▍        | 723/5000 [24:50<2:20:59,  1.98s/it]

training loss: 1.6405102014541626
training loss: 1.7287952899932861
training loss: 1.6762917041778564
training loss: 1.7052388191223145
training loss: 1.6343094110488892
training loss: 1.695730209350586


training:  15%|█▍        | 729/5000 [25:02<2:20:42,  1.98s/it]

training loss: 1.7993823289871216
training loss: 1.93592369556427
training loss: 1.705241084098816
training loss: 1.5811121463775635
training loss: 1.9085842370986938
training loss: 1.7447303533554077


training:  15%|█▍        | 735/5000 [25:14<2:20:28,  1.98s/it]

training loss: 1.7223882675170898
training loss: 1.8031182289123535
training loss: 1.6616264581680298
training loss: 1.6592421531677246
training loss: 1.8002276420593262
training loss: 1.6271727085113525


training:  15%|█▍        | 741/5000 [25:26<2:20:13,  1.98s/it]

training loss: 1.7725255489349365
training loss: 1.7376065254211426
training loss: 1.7118644714355469
training loss: 1.7738384008407593
training loss: 1.7815109491348267
training loss: 1.607923984527588


training:  15%|█▍        | 747/5000 [25:38<2:20:00,  1.98s/it]

training loss: 1.7244443893432617
training loss: 1.6817076206207275
training loss: 1.8164793252944946
training loss: 1.655470848083496
training loss: 1.7534565925598145
training loss: 1.5745388269424438


training:  15%|█▌        | 753/5000 [25:50<2:19:47,  1.97s/it]

training loss: 1.835710048675537
training loss: 1.5621743202209473
training loss: 1.6237295866012573
training loss: 1.707711935043335
training loss: 1.7837190628051758
training loss: 1.697016716003418


training:  15%|█▌        | 759/5000 [26:01<2:19:34,  1.97s/it]

training loss: 1.9169213771820068
training loss: 1.6214561462402344
training loss: 1.5644069910049438
training loss: 1.7464792728424072
training loss: 1.7325820922851562
training loss: 1.7096996307373047


training:  15%|█▌        | 765/5000 [26:13<2:19:22,  1.97s/it]

training loss: 1.6539549827575684
training loss: 1.6912569999694824
training loss: 1.7161520719528198
training loss: 1.8003042936325073
training loss: 1.779362440109253
training loss: 1.6760225296020508


training:  15%|█▌        | 771/5000 [26:25<2:19:10,  1.97s/it]

training loss: 1.5978049039840698
training loss: 1.6671220064163208
training loss: 1.5474705696105957
training loss: 1.7535345554351807
training loss: 1.509599208831787
training loss: 1.5820739269256592


training:  16%|█▌        | 777/5000 [26:37<2:18:57,  1.97s/it]

training loss: 1.5758023262023926
training loss: 1.6707367897033691
training loss: 1.6936239004135132
training loss: 1.687488079071045
training loss: 1.677046298980713
training loss: 1.7167294025421143


training:  16%|█▌        | 783/5000 [26:49<2:18:44,  1.97s/it]

training loss: 1.7488420009613037
training loss: 1.6491193771362305
training loss: 1.7610862255096436
training loss: 1.647144079208374
training loss: 1.7122066020965576
training loss: 1.8592581748962402


training:  16%|█▌        | 789/5000 [27:01<2:18:32,  1.97s/it]

training loss: 1.6419166326522827
training loss: 1.7042527198791504
training loss: 1.3766140937805176
training loss: 1.5738036632537842
training loss: 1.7684848308563232
training loss: 1.5269536972045898


training:  16%|█▌        | 795/5000 [27:12<2:18:19,  1.97s/it]

training loss: 1.9044909477233887
training loss: 1.684272289276123
training loss: 1.603916049003601
training loss: 1.652499794960022
training loss: 1.6804670095443726
training loss: 1.727317214012146
training loss: 1.7620762586593628


training:  16%|█▌        | 801/5000 [27:25<2:18:48,  1.98s/it]

validation loss: 1.6784659624099731
training loss: 1.5897890329360962
training loss: 1.7209444046020508
training loss: 1.619110345840454
training loss: 1.8465930223464966
training loss: 1.7895535230636597


training:  16%|█▌        | 807/5000 [27:36<2:18:25,  1.98s/it]

training loss: 1.697984218597412
training loss: 1.5889981985092163
training loss: 1.6092677116394043
training loss: 1.6558165550231934
training loss: 1.7107620239257812
training loss: 1.6507233381271362


training:  16%|█▋        | 813/5000 [27:48<2:18:04,  1.98s/it]

training loss: 1.600719690322876
training loss: 1.7107696533203125
training loss: 1.77323579788208
training loss: 1.6146795749664307
training loss: 1.7157282829284668
training loss: 1.6606080532073975


training:  16%|█▋        | 819/5000 [28:00<2:17:46,  1.98s/it]

training loss: 1.600113034248352
training loss: 1.6131584644317627
training loss: 1.6297152042388916
training loss: 1.738843321800232
training loss: 1.6083807945251465
training loss: 1.7289295196533203


training:  16%|█▋        | 825/5000 [28:12<2:17:30,  1.98s/it]

training loss: 1.5508986711502075
training loss: 1.6427372694015503
training loss: 1.7001903057098389
training loss: 1.666983962059021
training loss: 1.681556224822998
training loss: 1.5722907781600952


training:  17%|█▋        | 831/5000 [28:24<2:17:16,  1.98s/it]

training loss: 1.674720048904419
training loss: 1.658139705657959
training loss: 1.6860136985778809
training loss: 1.6478338241577148
training loss: 1.6964199542999268
training loss: 1.685654878616333


training:  17%|█▋        | 837/5000 [28:36<2:17:02,  1.98s/it]

training loss: 1.5998013019561768
training loss: 1.7524402141571045
training loss: 1.7569236755371094
training loss: 1.5338095426559448
training loss: 1.5832264423370361
training loss: 1.6509828567504883


training:  17%|█▋        | 843/5000 [28:47<2:16:48,  1.97s/it]

training loss: 1.618139624595642
training loss: 1.698648452758789
training loss: 1.7188576459884644
training loss: 1.8289042711257935
training loss: 1.6264475584030151
training loss: 1.713552713394165


training:  17%|█▋        | 849/5000 [28:59<2:16:36,  1.97s/it]

training loss: 1.6600682735443115
training loss: 1.6314798593521118
training loss: 1.70701265335083
training loss: 1.6453396081924438
training loss: 1.7777302265167236
training loss: 1.674917459487915


training:  17%|█▋        | 855/5000 [29:11<2:16:23,  1.97s/it]

training loss: 1.5948498249053955
training loss: 1.6646320819854736
training loss: 1.5964407920837402
training loss: 1.6873066425323486
training loss: 1.6831551790237427
training loss: 1.668246865272522


training:  17%|█▋        | 861/5000 [29:23<2:16:11,  1.97s/it]

training loss: 1.641982078552246
training loss: 1.507179617881775
training loss: 1.5841296911239624
training loss: 1.6983203887939453
training loss: 1.6717944145202637
training loss: 1.615981101989746


training:  17%|█▋        | 867/5000 [29:35<2:15:58,  1.97s/it]

training loss: 1.6168843507766724
training loss: 1.519646167755127
training loss: 1.5710203647613525
training loss: 1.6911914348602295
training loss: 1.606144666671753
training loss: 1.707617998123169


training:  17%|█▋        | 873/5000 [29:47<2:15:46,  1.97s/it]

training loss: 1.520885944366455
training loss: 1.8027424812316895
training loss: 1.6808487176895142
training loss: 1.6821720600128174
training loss: 1.7276631593704224
training loss: 1.691606044769287


training:  18%|█▊        | 879/5000 [29:58<2:15:35,  1.97s/it]

training loss: 1.6727045774459839
training loss: 1.6462393999099731
training loss: 1.6443908214569092
training loss: 1.64363694190979
training loss: 1.6075702905654907
training loss: 1.5686581134796143


training:  18%|█▊        | 885/5000 [30:10<2:15:22,  1.97s/it]

training loss: 1.7576162815093994
training loss: 1.6937617063522339
training loss: 1.5713342428207397
training loss: 1.5949567556381226
training loss: 1.6743965148925781
training loss: 1.7355656623840332


training:  18%|█▊        | 891/5000 [30:22<2:15:10,  1.97s/it]

training loss: 1.6775120496749878
training loss: 1.5794432163238525
training loss: 1.6705865859985352
training loss: 1.5434215068817139
training loss: 1.7981863021850586
training loss: 1.7564719915390015


training:  18%|█▊        | 897/5000 [30:34<2:14:59,  1.97s/it]

training loss: 1.6753560304641724
training loss: 1.6120600700378418
training loss: 1.5987786054611206
training loss: 1.6815516948699951
training loss: 1.6606671810150146
validation loss: 1.5163776874542236
training loss: 1.555293083190918


training:  18%|█▊        | 903/5000 [30:46<2:15:26,  1.98s/it]

training loss: 1.6530952453613281
training loss: 1.6606030464172363
training loss: 1.824751853942871
training loss: 1.8081166744232178
training loss: 1.6160938739776611
training loss: 1.5901691913604736


training:  18%|█▊        | 909/5000 [30:58<2:15:02,  1.98s/it]

training loss: 1.669442892074585
training loss: 1.6547577381134033
training loss: 1.6527659893035889
training loss: 1.6107892990112305
training loss: 1.669623613357544
training loss: 1.5896546840667725


training:  18%|█▊        | 915/5000 [31:10<2:14:41,  1.98s/it]

training loss: 1.5623306035995483
training loss: 1.7578641176223755
training loss: 1.6679726839065552
training loss: 1.6274561882019043
training loss: 1.697853684425354
training loss: 1.508209228515625


training:  18%|█▊        | 921/5000 [31:22<2:14:24,  1.98s/it]

training loss: 1.72748863697052
training loss: 1.660095453262329
training loss: 1.6710052490234375
training loss: 1.668544054031372
training loss: 1.5278563499450684
training loss: 1.5129351615905762


training:  19%|█▊        | 927/5000 [31:33<2:14:08,  1.98s/it]

training loss: 1.6956202983856201
training loss: 1.6223726272583008
training loss: 1.564666748046875
training loss: 1.718285322189331
training loss: 1.8214294910430908
training loss: 1.5498216152191162


training:  19%|█▊        | 933/5000 [31:45<2:13:53,  1.98s/it]

training loss: 1.6735774278640747
training loss: 1.6871427297592163
training loss: 1.607670783996582
training loss: 1.5554465055465698
training loss: 1.6007922887802124
training loss: 1.4888911247253418


training:  19%|█▉        | 939/5000 [31:57<2:13:39,  1.97s/it]

training loss: 1.6379947662353516
training loss: 1.6329272985458374
training loss: 1.5646016597747803
training loss: 1.8068699836730957
training loss: 1.673709511756897
training loss: 1.6511378288269043


training:  19%|█▉        | 945/5000 [32:09<2:13:27,  1.97s/it]

training loss: 1.6285508871078491
training loss: 1.5359135866165161
training loss: 1.6832654476165771
training loss: 1.5717949867248535
training loss: 1.6384081840515137
training loss: 1.6149829626083374


training:  19%|█▉        | 951/5000 [32:21<2:13:14,  1.97s/it]

training loss: 1.477445125579834
training loss: 1.6642942428588867
training loss: 1.7289273738861084
training loss: 1.6708840131759644
training loss: 1.562177062034607
training loss: 1.4929144382476807


training:  19%|█▉        | 957/5000 [32:33<2:13:02,  1.97s/it]

training loss: 1.539095163345337
training loss: 1.5536956787109375
training loss: 1.564103364944458
training loss: 1.6997933387756348
training loss: 1.6635217666625977
training loss: 1.6403980255126953


training:  19%|█▉        | 963/5000 [32:44<2:12:49,  1.97s/it]

training loss: 1.5640147924423218
training loss: 1.7026573419570923
training loss: 1.6341700553894043
training loss: 1.610365867614746
training loss: 1.5279395580291748
training loss: 1.6260268688201904


training:  19%|█▉        | 969/5000 [32:56<2:12:37,  1.97s/it]

training loss: 1.6623791456222534
training loss: 1.6771230697631836
training loss: 1.680722713470459
training loss: 1.61777663230896
training loss: 1.596437692642212
training loss: 1.5843501091003418


training:  20%|█▉        | 975/5000 [33:08<2:12:25,  1.97s/it]

training loss: 1.6301565170288086
training loss: 1.442408561706543
training loss: 1.589510202407837
training loss: 1.666130542755127
training loss: 1.7185583114624023
training loss: 1.6425328254699707


training:  20%|█▉        | 981/5000 [33:20<2:12:14,  1.97s/it]

training loss: 1.5514582395553589
training loss: 1.5690534114837646
training loss: 1.5782643556594849
training loss: 1.6882474422454834
training loss: 1.6957321166992188
training loss: 1.5775775909423828


training:  20%|█▉        | 987/5000 [33:32<2:12:03,  1.97s/it]

training loss: 1.6404848098754883
training loss: 1.6510543823242188
training loss: 1.555685043334961
training loss: 1.6800856590270996
training loss: 1.618072271347046
training loss: 1.806445837020874


training:  20%|█▉        | 993/5000 [33:44<2:11:52,  1.97s/it]

training loss: 1.5892236232757568
training loss: 1.6250851154327393
training loss: 1.5958638191223145
training loss: 1.6633294820785522
training loss: 1.6292341947555542
training loss: 1.5674903392791748


training:  20%|█▉        | 999/5000 [33:56<2:11:39,  1.97s/it]

training loss: 1.6742950677871704
training loss: 1.6316101551055908
training loss: 1.7313385009765625
validation loss: 1.5947333574295044
%s 

 %s (" in the [[7th century]] with the emergence of the prophet [[Muhammad]]. Within a century of his death, an Islamic state stretched from the [[Atlantic ocean]] in the west to [[central Asia]] in the east, which, however, was soon torn by civil wars ([[fitna]]s). After this, there would always be rival dynasties claiming the [[caliphate]], or leadership of the Muslim world, and many Islamic states or empires offering only token obedience to an increasingly powerless [[caliph]].  Nonetheless, the later empires of the [[Abbasid]] caliphs and the [[Seljuk Turks]] were among the largest and most powerful in the world. After the disastrous defeat of the Byzantines at the [[Battle of Manzikert]] in [[1071]], Christian Europe launched a series of [[Crusades]] and for a time captured Jerusalem. [[Saladin]], however, restored unity and defeated the [[

training:  20%|██        | 1001/5000 [34:30<4:18:22,  3.88s/it]

g univers it blight, the gurber have acts of the ration, the execration in the state gend of the cannering and univers' had the ign.  ===Paintugative==== ''Siths== A would ''Depublic [[Edd Shie]]'' in a halth of the [[Keets]]s eleaged which its was larged to area be uter-purb, for [[Bhistory MPhythine, gancle, greatures in the 1881. This of the locational deg per of the rising the about was be the feature, &quot;the recision forming the countro-mate (the prish and [[Europeana Stateshes]], of [[Herdment levi
training loss: 1.3723959922790527
training loss: 1.6437501907348633
training loss: 1.840078353881836
training loss: 1.677135944366455
training loss: 1.6297591924667358


training:  20%|██        | 1007/5000 [34:42<3:33:48,  3.21s/it]

training loss: 1.6564431190490723
training loss: 1.6261582374572754
training loss: 1.6357460021972656
training loss: 1.606273889541626
training loss: 1.6436352729797363
training loss: 1.6001274585723877


training:  20%|██        | 1013/5000 [34:54<3:06:06,  2.80s/it]

training loss: 1.5458920001983643
training loss: 1.4289897680282593
training loss: 1.5163764953613281
training loss: 1.6834886074066162
training loss: 1.6666735410690308
training loss: 1.6254862546920776


training:  20%|██        | 1019/5000 [35:05<2:48:09,  2.53s/it]

training loss: 1.5985075235366821
training loss: 1.5714882612228394
training loss: 1.6343542337417603
training loss: 1.4741950035095215
training loss: 1.6152907609939575
training loss: 1.6125826835632324


training:  20%|██        | 1025/5000 [35:17<2:36:11,  2.36s/it]

training loss: 1.7992427349090576
training loss: 1.5561336278915405
training loss: 1.7584528923034668
training loss: 1.6183675527572632
training loss: 1.5766217708587646
training loss: 1.5532917976379395


training:  21%|██        | 1031/5000 [35:29<2:28:04,  2.24s/it]

training loss: 1.5962049961090088
training loss: 1.7172390222549438
training loss: 1.6805583238601685
training loss: 1.6231701374053955
training loss: 1.577369213104248
training loss: 1.6231763362884521


training:  21%|██        | 1037/5000 [35:41<2:22:29,  2.16s/it]

training loss: 1.6530368328094482
training loss: 1.576998233795166
training loss: 1.5948915481567383
training loss: 1.5166354179382324
training loss: 1.6261065006256104
training loss: 1.6279114484786987


training:  21%|██        | 1043/5000 [35:53<2:18:34,  2.10s/it]

training loss: 1.6529874801635742
training loss: 1.5203639268875122
training loss: 1.510023593902588
training loss: 1.6183464527130127
training loss: 1.6563063859939575
training loss: 1.6310575008392334


training:  21%|██        | 1049/5000 [36:05<2:15:50,  2.06s/it]

training loss: 1.536197304725647
training loss: 1.5443646907806396
training loss: 1.6713181734085083
training loss: 1.557590126991272
training loss: 1.5333356857299805
training loss: 1.6124165058135986


training:  21%|██        | 1055/5000 [36:17<2:13:51,  2.04s/it]

training loss: 1.6931583881378174
training loss: 1.6157035827636719
training loss: 1.760022521018982
training loss: 1.3840430974960327
training loss: 1.7574878931045532
training loss: 1.581704020500183


training:  21%|██        | 1061/5000 [36:28<2:12:25,  2.02s/it]

training loss: 1.7050061225891113
training loss: 1.6528573036193848
training loss: 1.5220106840133667
training loss: 1.5659806728363037
training loss: 1.5915195941925049
training loss: 1.5765118598937988


training:  21%|██▏       | 1067/5000 [36:40<2:11:21,  2.00s/it]

training loss: 1.750534176826477
training loss: 1.4961755275726318
training loss: 1.46270751953125
training loss: 1.6079537868499756
training loss: 1.6874665021896362
training loss: 1.620790719985962


training:  21%|██▏       | 1073/5000 [36:52<2:10:33,  1.99s/it]

training loss: 1.6397265195846558
training loss: 1.581485629081726
training loss: 1.59306001663208
training loss: 1.5134336948394775
training loss: 1.6294372081756592
training loss: 1.6451771259307861


training:  22%|██▏       | 1079/5000 [37:04<2:09:56,  1.99s/it]

training loss: 1.5102037191390991
training loss: 1.5770316123962402
training loss: 1.4816409349441528
training loss: 1.7004156112670898
training loss: 1.6450316905975342
training loss: 1.4973466396331787


training:  22%|██▏       | 1085/5000 [37:16<2:09:26,  1.98s/it]

training loss: 1.6450021266937256
training loss: 1.4606640338897705
training loss: 1.725233554840088
training loss: 1.4732586145401
training loss: 1.7656915187835693
training loss: 1.5589898824691772


training:  22%|██▏       | 1091/5000 [37:28<2:09:02,  1.98s/it]

training loss: 1.7286697626113892
training loss: 1.6342947483062744
training loss: 1.6281275749206543
training loss: 1.462670087814331
training loss: 1.6228091716766357
training loss: 1.365110993385315


training:  22%|██▏       | 1097/5000 [37:39<2:08:42,  1.98s/it]

training loss: 1.743762493133545
training loss: 1.556183099746704
training loss: 1.5796730518341064
training loss: 1.5434134006500244
training loss: 1.7404688596725464
validation loss: 1.5559685230255127


training:  22%|██▏       | 1097/5000 [37:50<2:08:42,  1.98s/it]

training loss: 1.5802671909332275


training:  22%|██▏       | 1103/5000 [37:51<2:09:03,  1.99s/it]

training loss: 1.6421303749084473
training loss: 1.7369210720062256
training loss: 1.6313755512237549
training loss: 1.5497372150421143
training loss: 1.6727149486541748
training loss: 1.548459768295288


training:  22%|██▏       | 1109/5000 [38:03<2:08:35,  1.98s/it]

training loss: 1.6427687406539917
training loss: 1.6800929307937622
training loss: 1.528541088104248
training loss: 1.5398036241531372
training loss: 1.667482614517212
training loss: 1.584505319595337


training:  22%|██▏       | 1115/5000 [38:15<2:08:13,  1.98s/it]

training loss: 1.6126561164855957
training loss: 1.6178196668624878
training loss: 1.6367701292037964
training loss: 1.6301612854003906
training loss: 1.4697444438934326
training loss: 1.63710355758667


training:  22%|██▏       | 1121/5000 [38:27<2:07:54,  1.98s/it]

training loss: 1.5604588985443115
training loss: 1.5503309965133667
training loss: 1.4121168851852417
training loss: 1.493748664855957
training loss: 1.5398999452590942
training loss: 1.6438586711883545


training:  23%|██▎       | 1127/5000 [38:39<2:07:36,  1.98s/it]

training loss: 1.4471759796142578
training loss: 1.5566973686218262
training loss: 1.6533626317977905
training loss: 1.4223136901855469
training loss: 1.6723861694335938
training loss: 1.5628776550292969


training:  23%|██▎       | 1133/5000 [38:51<2:07:22,  1.98s/it]

training loss: 1.3038698434829712
training loss: 1.6515464782714844
training loss: 1.489296793937683
training loss: 1.4369882345199585
training loss: 1.805122971534729
training loss: 1.7163907289505005


training:  23%|██▎       | 1139/5000 [39:03<2:07:07,  1.98s/it]

training loss: 1.5341325998306274
training loss: 1.6579185724258423
training loss: 1.5952868461608887
training loss: 1.8107774257659912
training loss: 1.5406333208084106
training loss: 1.688827395439148


training:  23%|██▎       | 1145/5000 [39:14<2:06:52,  1.97s/it]

training loss: 1.6161272525787354
training loss: 1.5447274446487427
training loss: 1.5799249410629272
training loss: 1.3301873207092285
training loss: 1.5092244148254395
training loss: 1.470192551612854


training:  23%|██▎       | 1151/5000 [39:26<2:06:40,  1.97s/it]

training loss: 1.5419596433639526
training loss: 1.557464599609375
training loss: 1.6581145524978638
training loss: 1.552243947982788
training loss: 1.56036376953125
training loss: 1.5910981893539429


training:  23%|██▎       | 1157/5000 [39:38<2:06:27,  1.97s/it]

training loss: 1.6678509712219238
training loss: 1.611163854598999
training loss: 1.5354347229003906
training loss: 1.509258508682251
training loss: 1.513096570968628
training loss: 1.7429050207138062


training:  23%|██▎       | 1163/5000 [39:50<2:06:14,  1.97s/it]

training loss: 1.5751667022705078
training loss: 1.6022603511810303
training loss: 1.7304593324661255
training loss: 1.7098698616027832
training loss: 1.5374009609222412
training loss: 1.6071445941925049


training:  23%|██▎       | 1169/5000 [40:02<2:06:02,  1.97s/it]

training loss: 1.5320544242858887
training loss: 1.5847163200378418
training loss: 1.6784666776657104
training loss: 1.4912548065185547
training loss: 1.5676319599151611
training loss: 1.60987389087677


training:  24%|██▎       | 1175/5000 [40:14<2:05:50,  1.97s/it]

training loss: 1.6381553411483765
training loss: 1.540380597114563
training loss: 1.4208223819732666
training loss: 1.5975135564804077
training loss: 1.7311885356903076
training loss: 1.593959927558899


training:  24%|██▎       | 1181/5000 [40:25<2:05:38,  1.97s/it]

training loss: 1.5904591083526611
training loss: 1.6107944250106812
training loss: 1.581225037574768
training loss: 1.600176215171814
training loss: 1.671146035194397
training loss: 1.5151088237762451


training:  24%|██▎       | 1187/5000 [40:37<2:05:26,  1.97s/it]

training loss: 1.5748764276504517
training loss: 1.4485236406326294
training loss: 1.621820092201233
training loss: 1.5843995809555054
training loss: 1.6237022876739502
training loss: 1.5073460340499878


training:  24%|██▍       | 1193/5000 [40:49<2:05:14,  1.97s/it]

training loss: 1.6603983640670776
training loss: 1.3722000122070312
training loss: 1.7661892175674438
training loss: 1.6103196144104004
training loss: 1.556396245956421
training loss: 1.6791267395019531


training:  24%|██▍       | 1199/5000 [41:01<2:05:02,  1.97s/it]

training loss: 1.5391581058502197
training loss: 1.590839147567749
training loss: 1.5513533353805542
validation loss: 1.559837818145752
training loss: 1.4883556365966797
training loss: 1.5321391820907593
training loss: 1.6741714477539062


training:  24%|██▍       | 1205/5000 [41:13<2:05:27,  1.98s/it]

training loss: 1.5962272882461548
training loss: 1.6237998008728027
training loss: 1.5535187721252441
training loss: 1.5309256315231323
training loss: 1.7017048597335815
training loss: 1.3931753635406494


training:  24%|██▍       | 1211/5000 [41:25<2:05:04,  1.98s/it]

training loss: 1.6262599229812622
training loss: 1.6817028522491455
training loss: 1.5292514562606812
training loss: 1.6538006067276
training loss: 1.5065115690231323
training loss: 1.599472999572754


training:  24%|██▍       | 1217/5000 [41:37<2:04:44,  1.98s/it]

training loss: 1.602949857711792
training loss: 1.7426917552947998
training loss: 1.532560110092163
training loss: 1.615360140800476
training loss: 1.5934561491012573
training loss: 1.5088200569152832


training:  24%|██▍       | 1223/5000 [41:49<2:04:27,  1.98s/it]

training loss: 1.457650065422058
training loss: 1.6400226354599
training loss: 1.475854754447937
training loss: 1.4351531267166138
training loss: 1.5569652318954468
training loss: 1.4619781970977783


training:  25%|██▍       | 1229/5000 [42:00<2:04:11,  1.98s/it]

training loss: 1.6918904781341553
training loss: 1.529468297958374
training loss: 1.6424401998519897
training loss: 1.5897446870803833
training loss: 1.3985787630081177
training loss: 1.581916332244873


training:  25%|██▍       | 1235/5000 [42:12<2:03:57,  1.98s/it]

training loss: 1.2165189981460571
training loss: 1.762321949005127
training loss: 1.5678746700286865
training loss: 1.5524042844772339
training loss: 1.506740927696228
training loss: 1.4667760133743286


training:  25%|██▍       | 1241/5000 [42:24<2:03:43,  1.97s/it]

training loss: 1.591025948524475
training loss: 1.5580874681472778
training loss: 1.5020747184753418
training loss: 1.6132164001464844
training loss: 1.5881836414337158
training loss: 1.6228810548782349


training:  25%|██▍       | 1247/5000 [42:36<2:03:29,  1.97s/it]

training loss: 1.4653533697128296
training loss: 1.604844093322754
training loss: 1.594157338142395
training loss: 1.5673801898956299
training loss: 1.5719109773635864
training loss: 1.7630953788757324


training:  25%|██▌       | 1253/5000 [42:48<2:03:16,  1.97s/it]

training loss: 1.7331537008285522
training loss: 1.5800726413726807
training loss: 1.5642036199569702
training loss: 1.6107269525527954
training loss: 1.807936191558838
training loss: 1.5998355150222778


training:  25%|██▌       | 1259/5000 [43:00<2:03:04,  1.97s/it]

training loss: 1.5888608694076538
training loss: 1.5119935274124146
training loss: 1.599226474761963
training loss: 1.6913098096847534
training loss: 1.5257893800735474


training:  25%|██▌       | 1259/5000 [43:10<2:03:04,  1.97s/it]

training loss: 1.6150671243667603


training:  25%|██▌       | 1265/5000 [43:11<2:02:52,  1.97s/it]

training loss: 1.6412867307662964
training loss: 1.5904548168182373
training loss: 1.5746935606002808
training loss: 1.5594819784164429
training loss: 1.442103624343872
training loss: 1.5000280141830444


training:  25%|██▌       | 1271/5000 [43:23<2:02:40,  1.97s/it]

training loss: 1.621389627456665
training loss: 1.709855318069458
training loss: 1.6100850105285645
training loss: 1.5708444118499756
training loss: 1.3442788124084473
training loss: 1.5456780195236206


training:  26%|██▌       | 1277/5000 [43:35<2:02:29,  1.97s/it]

training loss: 1.5334287881851196
training loss: 1.5837396383285522
training loss: 1.612614393234253
training loss: 1.5234359502792358
training loss: 1.5699236392974854
training loss: 1.4876350164413452


training:  26%|██▌       | 1283/5000 [43:47<2:02:16,  1.97s/it]

training loss: 1.5394514799118042
training loss: 1.5783833265304565
training loss: 1.5904934406280518
training loss: 1.503765344619751
training loss: 1.5427281856536865
training loss: 1.5067671537399292


training:  26%|██▌       | 1289/5000 [43:59<2:02:04,  1.97s/it]

training loss: 1.4868451356887817
training loss: 1.384900450706482
training loss: 1.4828852415084839
training loss: 1.5985307693481445
training loss: 1.5618005990982056
training loss: 1.708517074584961


training:  26%|██▌       | 1295/5000 [44:11<2:01:52,  1.97s/it]

training loss: 1.5148659944534302
training loss: 1.5734089612960815
training loss: 1.4769365787506104
training loss: 1.5131970643997192
training loss: 1.5680464506149292
training loss: 1.6329830884933472
training loss: 1.8117502927780151


training:  26%|██▌       | 1301/5000 [44:23<2:02:15,  1.98s/it]

validation loss: 1.4094914197921753
training loss: 1.464032530784607
training loss: 1.5527952909469604
training loss: 1.5472123622894287
training loss: 1.5602625608444214
training loss: 1.5025445222854614


training:  26%|██▌       | 1307/5000 [44:34<2:01:52,  1.98s/it]

training loss: 1.5415639877319336
training loss: 1.5365809202194214
training loss: 1.6134625673294067
training loss: 1.6735607385635376
training loss: 1.5441120862960815
training loss: 1.731644868850708


training:  26%|██▋       | 1313/5000 [44:46<2:01:33,  1.98s/it]

training loss: 1.5514769554138184
training loss: 1.235770583152771
training loss: 1.564746379852295
training loss: 1.5289047956466675
training loss: 1.443444848060608
training loss: 1.6063477993011475


training:  26%|██▋       | 1319/5000 [44:58<2:01:16,  1.98s/it]

training loss: 1.5372623205184937
training loss: 1.6919797658920288
training loss: 1.5133012533187866
training loss: 1.5502498149871826
training loss: 1.6089200973510742
training loss: 1.4979952573776245


training:  26%|██▋       | 1325/5000 [45:10<2:01:01,  1.98s/it]

training loss: 1.526092290878296
training loss: 1.5013052225112915
training loss: 1.5136979818344116
training loss: 1.7717798948287964
training loss: 1.4255050420761108
training loss: 1.5085097551345825


training:  27%|██▋       | 1331/5000 [45:22<2:00:47,  1.98s/it]

training loss: 1.7202516794204712
training loss: 1.4058645963668823
training loss: 1.5991464853286743
training loss: 1.5006762742996216
training loss: 1.5385373830795288
training loss: 1.6446257829666138


training:  27%|██▋       | 1337/5000 [45:34<2:00:33,  1.97s/it]

training loss: 1.6103737354278564
training loss: 1.567409873008728
training loss: 1.5730061531066895
training loss: 1.6429762840270996
training loss: 1.5127846002578735
training loss: 1.5975924730300903


training:  27%|██▋       | 1343/5000 [45:46<2:00:20,  1.97s/it]

training loss: 1.5118038654327393
training loss: 1.5184228420257568
training loss: 1.4207900762557983
training loss: 1.6478683948516846
training loss: 1.4775917530059814
training loss: 1.4910614490509033


training:  27%|██▋       | 1349/5000 [45:57<2:00:08,  1.97s/it]

training loss: 1.5764371156692505
training loss: 1.3973667621612549
training loss: 1.4826799631118774
training loss: 1.5344140529632568
training loss: 1.6725393533706665
training loss: 1.8153443336486816


training:  27%|██▋       | 1355/5000 [46:09<1:59:55,  1.97s/it]

training loss: 1.5121452808380127
training loss: 1.4928256273269653
training loss: 1.5814157724380493
training loss: 1.4833287000656128
training loss: 1.5206722021102905
training loss: 1.6222044229507446


training:  27%|██▋       | 1361/5000 [46:21<1:59:42,  1.97s/it]

training loss: 1.6297370195388794
training loss: 1.494359016418457
training loss: 1.8976020812988281
training loss: 1.6746189594268799
training loss: 1.5858843326568604
training loss: 1.6014496088027954


training:  27%|██▋       | 1367/5000 [46:33<1:59:29,  1.97s/it]

training loss: 1.6437994241714478
training loss: 1.5688608884811401
training loss: 1.5045233964920044
training loss: 1.5762290954589844
training loss: 1.4723787307739258
training loss: 1.480824589729309


training:  27%|██▋       | 1373/5000 [46:45<1:59:18,  1.97s/it]

training loss: 1.634852409362793
training loss: 1.4999126195907593
training loss: 1.4994196891784668
training loss: 1.538645625114441
training loss: 1.5811446905136108
training loss: 1.5354671478271484


training:  28%|██▊       | 1379/5000 [46:57<1:59:06,  1.97s/it]

training loss: 1.4630966186523438
training loss: 1.5106735229492188
training loss: 1.5237795114517212
training loss: 1.6367666721343994
training loss: 1.4991974830627441
training loss: 1.6426748037338257


training:  28%|██▊       | 1385/5000 [47:08<1:58:55,  1.97s/it]

training loss: 1.4719173908233643
training loss: 1.5959278345108032
training loss: 1.550972580909729
training loss: 1.542934775352478
training loss: 1.409529447555542
training loss: 1.6479524374008179


training:  28%|██▊       | 1391/5000 [47:20<1:58:42,  1.97s/it]

training loss: 1.5753120183944702
training loss: 1.6416938304901123
training loss: 1.6042931079864502
training loss: 1.5091794729232788
training loss: 1.6114143133163452
training loss: 1.4935414791107178


training:  28%|██▊       | 1397/5000 [47:32<1:58:30,  1.97s/it]

training loss: 1.569008708000183
training loss: 1.4862931966781616
training loss: 1.5266767740249634
training loss: 1.635496735572815
training loss: 1.6709610223770142
validation loss: 1.4747240543365479
training loss: 1.4620095491409302


training:  28%|██▊       | 1403/5000 [47:44<1:58:53,  1.98s/it]

training loss: 1.6312682628631592
training loss: 1.5631961822509766
training loss: 1.602840781211853
training loss: 1.4964566230773926
training loss: 1.512283444404602
training loss: 1.4175305366516113


training:  28%|██▊       | 1409/5000 [47:56<1:58:31,  1.98s/it]

training loss: 1.5191473960876465
training loss: 1.4827675819396973
training loss: 1.5623486042022705
training loss: 1.535521388053894
training loss: 1.5415841341018677
training loss: 1.5234756469726562


training:  28%|██▊       | 1415/5000 [48:08<1:58:12,  1.98s/it]

training loss: 1.5029892921447754
training loss: 1.4434998035430908
training loss: 1.5358859300613403
training loss: 1.5762511491775513
training loss: 1.4476814270019531
training loss: 1.4966813325881958


training:  28%|██▊       | 1421/5000 [48:20<1:57:55,  1.98s/it]

training loss: 1.5708048343658447
training loss: 1.4637774229049683
training loss: 1.5310055017471313
training loss: 1.4585306644439697
training loss: 1.5019270181655884
training loss: 1.5103081464767456


training:  29%|██▊       | 1427/5000 [48:32<1:57:39,  1.98s/it]

training loss: 1.5563886165618896
training loss: 1.5974242687225342
training loss: 1.5020687580108643
training loss: 1.380323052406311
training loss: 1.6122801303863525
training loss: 1.5119906663894653


training:  29%|██▊       | 1433/5000 [48:43<1:57:24,  1.98s/it]

training loss: 1.2516783475875854
training loss: 1.4818402528762817
training loss: 1.4964184761047363
training loss: 1.6004630327224731
training loss: 1.4719197750091553
training loss: 1.4995652437210083


training:  29%|██▉       | 1439/5000 [48:55<1:57:11,  1.97s/it]

training loss: 1.4661600589752197
training loss: 1.6739274263381958
training loss: 1.494661569595337
training loss: 1.6409313678741455
training loss: 1.544927954673767
training loss: 1.6107401847839355


training:  29%|██▉       | 1445/5000 [49:07<1:56:59,  1.97s/it]

training loss: 1.5081614255905151
training loss: 1.4900763034820557
training loss: 1.5641987323760986
training loss: 1.5112513303756714
training loss: 1.5454363822937012
training loss: 1.587247371673584


training:  29%|██▉       | 1451/5000 [49:19<1:56:46,  1.97s/it]

training loss: 1.4415946006774902
training loss: 1.5320168733596802
training loss: 1.5555596351623535
training loss: 1.576426386833191
training loss: 1.7155499458312988
training loss: 1.5363579988479614


training:  29%|██▉       | 1457/5000 [49:31<1:56:33,  1.97s/it]

training loss: 1.5983202457427979
training loss: 1.5152640342712402
training loss: 1.5413174629211426
training loss: 1.4523371458053589
training loss: 1.5440744161605835
training loss: 1.5458909273147583


training:  29%|██▉       | 1463/5000 [49:43<1:56:21,  1.97s/it]

training loss: 1.6047030687332153
training loss: 1.5055556297302246
training loss: 1.5998226404190063
training loss: 1.5424634218215942
training loss: 1.547296166419983
training loss: 1.5843114852905273


training:  29%|██▉       | 1469/5000 [49:54<1:56:08,  1.97s/it]

training loss: 1.6470087766647339
training loss: 1.5608398914337158
training loss: 1.617280125617981
training loss: 1.535747766494751
training loss: 1.6265735626220703
training loss: 1.4844114780426025


training:  30%|██▉       | 1475/5000 [50:06<1:55:56,  1.97s/it]

training loss: 1.5194746255874634
training loss: 1.4119752645492554
training loss: 1.4622169733047485
training loss: 1.4762318134307861
training loss: 1.5011476278305054
training loss: 1.8086055517196655


training:  30%|██▉       | 1481/5000 [50:18<1:55:44,  1.97s/it]

training loss: 1.547850251197815
training loss: 1.5565685033798218
training loss: 1.6208895444869995
training loss: 1.54793381690979
training loss: 1.5049625635147095
training loss: 1.4882607460021973


training:  30%|██▉       | 1487/5000 [50:30<1:55:32,  1.97s/it]

training loss: 1.4502848386764526
training loss: 1.5763893127441406
training loss: 1.4816535711288452
training loss: 1.484412670135498
training loss: 1.547305941581726
training loss: 1.507360816001892


training:  30%|██▉       | 1493/5000 [50:42<1:55:21,  1.97s/it]

training loss: 1.483106017112732
training loss: 1.7785958051681519
training loss: 1.5055506229400635
training loss: 1.5693975687026978
training loss: 1.4935246706008911
training loss: 1.505363941192627


training:  30%|██▉       | 1499/5000 [50:54<1:55:10,  1.97s/it]

training loss: 1.7008265256881714
training loss: 1.4828859567642212
training loss: 1.4919136762619019
validation loss: 1.4811040163040161
%s 

 %s ('Italia]] [[ro:Italia]] [[ru:Ð\x98Ñ\x82Ð°Ð»Ð¸Ñ\x8f]] [[sa:à¤\x87à¤\x9fà¤²à¥\x80]] [[sc:ItÃ\xa0lia]] [[scn:Italia]] [[sh:Italija]] [[simple:Italy]] [[sk:Taliansko]] [[sl:Italija]] [[sq:Italia]] [[sr:Ð\x98Ñ\x82Ð°Ð»Ð¸Ñ\x98Ð°]] [[sv:Italien]] [[ta:à®\x87à®¤à¯\x8dà®¤à®¾à®²à®¿]] [[th:à¸\x9bà¸£à¸°à¹\x80à¸\x97à¸¨à¸\xadà¸´à¸\x95à¸²à¸¥à¸µ]] [[tl:Italya]] [[tr:Ä°talya]] [[uk:Ð\x86Ñ\x82Ð°Ð»Ñ\x96Ñ\x8f]] [[ur:Ø§Ù¹Ù\x84Û\x8c]] [[vec:ItaÅ\x82ia]] [[vi:Ã\x9d]] [[yi:×\x90×\x99×\x98×\x90Ö·×\x9c×\x99×¢]] [[zh:æ\x84\x8få¤§å\x88©]] [[zh-min-nan:Italia]]</text>     </revision>   </page>   <page>     <title>India</title>     <id>14533</id>     <restrictions>move=:edit=</restrictions>     <revision>       <id>42103953</id>       <timestamp>2006-03-03T21:25:06Z</timestamp>       <contributor>         <username>Rama\'s Arrow</username>         <id>591624</id>       <

training:  30%|███       | 1501/5000 [51:28<3:45:55,  3.87s/it]

nticle games. Support monthy and in the one. In the lip]] internationall's the algority of maxter on out creat design languages: (asking level) on is de [[1924 Judasico]] and [[Backore sper Emperor|Bryde]]'s ackway musembers where the [[Unite (contived somewhork)|Ihan (centre)|Barbout in Salitary (1866)|choriese basÃ³n troundarian day [[add]])==  Compariation claims, or doubalify '''[[Army 20]]''': ''Lammy'' (1 ''Chara'' - The demore of [[candson]] were the opened of differencial luncose first minding more 
training loss: 1.6209068298339844
training loss: 1.4733279943466187
training loss: 1.62369966506958
training loss: 1.6825578212738037
training loss: 1.5423343181610107


training:  30%|███       | 1507/5000 [51:40<3:06:56,  3.21s/it]

training loss: 1.6239246129989624
training loss: 1.5825120210647583
training loss: 1.3966299295425415
training loss: 1.420445442199707
training loss: 1.5659632682800293
training loss: 1.5938827991485596


training:  30%|███       | 1513/5000 [51:52<2:42:41,  2.80s/it]

training loss: 1.5726656913757324
training loss: 1.5713250637054443
training loss: 1.5346572399139404
training loss: 1.6139994859695435
training loss: 1.5283550024032593
training loss: 1.615329384803772


training:  30%|███       | 1519/5000 [52:03<2:26:58,  2.53s/it]

training loss: 1.4514693021774292
training loss: 1.3528451919555664
training loss: 1.5560632944107056
training loss: 1.4022213220596313
training loss: 1.567033052444458
training loss: 1.5188583135604858


training:  30%|███       | 1525/5000 [52:15<2:16:30,  2.36s/it]

training loss: 1.5590033531188965
training loss: 1.3935598134994507
training loss: 1.550774097442627
training loss: 1.5532582998275757
training loss: 1.5402858257293701
training loss: 1.5832470655441284


training:  31%|███       | 1531/5000 [52:27<2:09:22,  2.24s/it]

training loss: 1.5698204040527344
training loss: 1.5341744422912598
training loss: 1.5841292142868042
training loss: 1.6718642711639404
training loss: 1.5654557943344116
training loss: 1.686432123184204


training:  31%|███       | 1537/5000 [52:39<2:04:28,  2.16s/it]

training loss: 1.5643070936203003
training loss: 1.5509305000305176
training loss: 1.5359455347061157
training loss: 1.525083065032959
training loss: 1.4221380949020386
training loss: 1.5132269859313965


training:  31%|███       | 1543/5000 [52:51<2:01:01,  2.10s/it]

training loss: 1.5230849981307983
training loss: 1.2264701128005981
training loss: 1.5803804397583008
training loss: 1.520231008529663
training loss: 1.6541866064071655
training loss: 1.4796504974365234


training:  31%|███       | 1549/5000 [53:03<1:58:36,  2.06s/it]

training loss: 1.6074004173278809
training loss: 1.5525407791137695
training loss: 1.4037333726882935
training loss: 1.5768256187438965
training loss: 1.7165607213974
training loss: 1.4570538997650146


training:  31%|███       | 1555/5000 [53:15<1:56:51,  2.04s/it]

training loss: 1.4639122486114502
training loss: 1.5078229904174805
training loss: 1.5103471279144287
training loss: 1.6129035949707031
training loss: 1.543859601020813
training loss: 1.3523197174072266


training:  31%|███       | 1561/5000 [53:26<1:55:34,  2.02s/it]

training loss: 1.5088874101638794
training loss: 1.332417368888855
training loss: 1.470089077949524
training loss: 1.6345415115356445
training loss: 1.5198562145233154
training loss: 1.5067005157470703


training:  31%|███▏      | 1567/5000 [53:38<1:54:37,  2.00s/it]

training loss: 1.8691461086273193
training loss: 1.684767484664917
training loss: 1.5725414752960205
training loss: 1.519290566444397
training loss: 1.3243192434310913
training loss: 1.413106083869934


training:  31%|███▏      | 1573/5000 [53:50<1:53:55,  1.99s/it]

training loss: 1.4533729553222656
training loss: 1.736511468887329
training loss: 1.6813935041427612
training loss: 1.7878812551498413
training loss: 1.5247833728790283
training loss: 1.3709384202957153


training:  32%|███▏      | 1579/5000 [54:02<1:53:21,  1.99s/it]

training loss: 1.5755093097686768
training loss: 1.5708975791931152
training loss: 1.7742291688919067
training loss: 1.5572375059127808
training loss: 1.5722836256027222
training loss: 1.4995653629302979


training:  32%|███▏      | 1585/5000 [54:14<1:52:54,  1.98s/it]

training loss: 1.4953734874725342
training loss: 1.482921838760376
training loss: 1.427847981452942
training loss: 1.428857445716858
training loss: 1.4041657447814941
training loss: 1.4684128761291504


training:  32%|███▏      | 1591/5000 [54:26<1:52:32,  1.98s/it]

training loss: 1.6564580202102661
training loss: 1.5020945072174072
training loss: 1.5762429237365723
training loss: 1.568140983581543
training loss: 1.5182729959487915
training loss: 1.5447611808776855


training:  32%|███▏      | 1597/5000 [54:37<1:52:12,  1.98s/it]

training loss: 1.517183780670166
training loss: 1.5198819637298584
training loss: 1.5194125175476074
training loss: 1.4564220905303955
training loss: 1.5942199230194092
validation loss: 1.4267414808273315
training loss: 1.5513370037078857


training:  32%|███▏      | 1603/5000 [54:49<1:52:28,  1.99s/it]

training loss: 1.548470139503479
training loss: 1.3540425300598145
training loss: 1.3427269458770752
training loss: 1.7050879001617432
training loss: 1.5394573211669922
training loss: 1.4632222652435303


training:  32%|███▏      | 1609/5000 [55:01<1:52:02,  1.98s/it]

training loss: 1.5348012447357178
training loss: 1.515409231185913
training loss: 1.5671968460083008
training loss: 1.5413408279418945
training loss: 1.511029839515686
training loss: 1.5732451677322388


training:  32%|███▏      | 1615/5000 [55:13<1:51:40,  1.98s/it]

training loss: 1.5584272146224976
training loss: 1.4897847175598145
training loss: 1.5489137172698975
training loss: 1.5150196552276611
training loss: 1.4557669162750244
training loss: 1.4738879203796387


training:  32%|███▏      | 1621/5000 [55:25<1:51:22,  1.98s/it]

training loss: 1.482426643371582
training loss: 1.5114282369613647
training loss: 1.5004304647445679
training loss: 1.5662908554077148
training loss: 1.5962162017822266
training loss: 1.5995213985443115


training:  33%|███▎      | 1627/5000 [55:37<1:51:05,  1.98s/it]

training loss: 1.5364025831222534
training loss: 1.5248816013336182
training loss: 1.6359888315200806
training loss: 1.4074201583862305
training loss: 1.5728704929351807
training loss: 1.4998466968536377


training:  33%|███▎      | 1633/5000 [55:49<1:50:51,  1.98s/it]

training loss: 1.2783381938934326
training loss: 1.4609413146972656
training loss: 1.6991063356399536
training loss: 1.5613092184066772
training loss: 1.5497868061065674
training loss: 1.55291748046875


training:  33%|███▎      | 1639/5000 [56:00<1:50:37,  1.97s/it]

training loss: 1.5471407175064087
training loss: 1.460099458694458
training loss: 1.5056285858154297
training loss: 1.579571008682251
training loss: 1.4762651920318604
training loss: 1.5368496179580688


training:  33%|███▎      | 1645/5000 [56:12<1:50:23,  1.97s/it]

training loss: 1.4360289573669434
training loss: 1.5845956802368164
training loss: 1.5149279832839966
training loss: 1.6264395713806152
training loss: 1.403855562210083
training loss: 1.436769962310791


training:  33%|███▎      | 1651/5000 [56:24<1:50:11,  1.97s/it]

training loss: 1.5056636333465576
training loss: 1.4087536334991455
training loss: 1.5298035144805908
training loss: 1.5890179872512817
training loss: 1.4935739040374756
training loss: 1.5678119659423828


training:  33%|███▎      | 1657/5000 [56:36<1:49:58,  1.97s/it]

training loss: 1.4953670501708984
training loss: 1.4806125164031982
training loss: 1.6167795658111572
training loss: 1.4306437969207764
training loss: 1.4785507917404175
training loss: 1.5164828300476074


training:  33%|███▎      | 1663/5000 [56:48<1:49:45,  1.97s/it]

training loss: 1.5023674964904785
training loss: 1.5522725582122803
training loss: 1.4628493785858154
training loss: 1.5232597589492798
training loss: 1.4667456150054932
training loss: 1.6112279891967773


training:  33%|███▎      | 1669/5000 [57:00<1:49:34,  1.97s/it]

training loss: 1.5471702814102173
training loss: 1.4035509824752808
training loss: 1.5575991868972778
training loss: 1.4379806518554688
training loss: 1.56345534324646
training loss: 1.6243181228637695


training:  34%|███▎      | 1675/5000 [57:12<1:49:22,  1.97s/it]

training loss: 1.56276273727417
training loss: 1.5176596641540527
training loss: 1.5441551208496094
training loss: 1.503419041633606
training loss: 1.5608545541763306
training loss: 1.4625223875045776


training:  34%|███▎      | 1681/5000 [57:23<1:49:10,  1.97s/it]

training loss: 1.5407609939575195
training loss: 1.435081124305725
training loss: 1.3252577781677246
training loss: 1.5260200500488281
training loss: 1.489688754081726
training loss: 1.4379805326461792


training:  34%|███▎      | 1687/5000 [57:35<1:48:57,  1.97s/it]

training loss: 1.5279127359390259
training loss: 1.4218294620513916
training loss: 1.4484751224517822
training loss: 1.6923943758010864
training loss: 1.612329125404358
training loss: 1.4706518650054932


training:  34%|███▍      | 1693/5000 [57:47<1:48:45,  1.97s/it]

training loss: 1.4103822708129883
training loss: 1.6565091609954834
training loss: 1.4870100021362305
training loss: 1.4710283279418945
training loss: 1.6491472721099854
training loss: 1.6053799390792847


training:  34%|███▍      | 1699/5000 [57:59<1:48:34,  1.97s/it]

training loss: 1.5874289274215698
training loss: 1.4647685289382935
training loss: 1.5842602252960205
validation loss: 1.4427570104599
training loss: 1.4735101461410522
training loss: 1.6244288682937622
training loss: 1.4330633878707886


training:  34%|███▍      | 1705/5000 [58:11<1:48:55,  1.98s/it]

training loss: 1.5854355096817017
training loss: 1.4528357982635498
training loss: 1.5570876598358154
training loss: 1.5461323261260986
training loss: 1.4771618843078613
training loss: 1.5685750246047974


training:  34%|███▍      | 1711/5000 [58:23<1:48:33,  1.98s/it]

training loss: 1.516831874847412
training loss: 1.4253789186477661
training loss: 1.5241148471832275
training loss: 1.6072547435760498
training loss: 1.5570945739746094
training loss: 1.4944994449615479


training:  34%|███▍      | 1717/5000 [58:35<1:48:14,  1.98s/it]

training loss: 1.4809705018997192
training loss: 1.4950132369995117
training loss: 1.4009093046188354
training loss: 1.4333183765411377
training loss: 1.5416823625564575
training loss: 1.4223757982254028


training:  34%|███▍      | 1723/5000 [58:46<1:47:57,  1.98s/it]

training loss: 1.5987597703933716
training loss: 1.570091724395752
training loss: 1.5510648488998413
training loss: 1.2837971448898315
training loss: 1.4421619176864624
training loss: 1.4001471996307373


training:  35%|███▍      | 1729/5000 [58:58<1:47:42,  1.98s/it]

training loss: 1.4938896894454956
training loss: 1.4830726385116577
training loss: 1.4162524938583374
training loss: 1.5005282163619995
training loss: 1.4613969326019287
training loss: 1.6240884065628052


training:  35%|███▍      | 1735/5000 [59:10<1:47:28,  1.97s/it]

training loss: 1.5445219278335571
training loss: 1.5348759889602661
training loss: 1.426727533340454
training loss: 1.5682436227798462
training loss: 1.5521156787872314
training loss: 1.461276888847351


training:  35%|███▍      | 1741/5000 [59:22<1:47:15,  1.97s/it]

training loss: 1.4538540840148926
training loss: 1.6230131387710571
training loss: 1.5469738245010376
training loss: 1.5005358457565308
training loss: 1.390739917755127
training loss: 1.4048079252243042


training:  35%|███▍      | 1747/5000 [59:34<1:47:02,  1.97s/it]

training loss: 1.4846222400665283
training loss: 1.4629617929458618
training loss: 1.4310635328292847
training loss: 1.567617416381836
training loss: 1.499160885810852
training loss: 1.460896372795105


training:  35%|███▌      | 1753/5000 [59:46<1:46:49,  1.97s/it]

training loss: 1.4505773782730103
training loss: 1.2996174097061157
training loss: 1.3851338624954224
training loss: 1.5003039836883545
training loss: 1.6259102821350098
training loss: 1.6291770935058594


training:  35%|███▌      | 1759/5000 [59:57<1:46:38,  1.97s/it]

training loss: 1.4604517221450806
training loss: 1.4997397661209106
training loss: 1.5835143327713013
training loss: 1.397580623626709
training loss: 1.4617539644241333
training loss: 1.7253444194793701


training:  35%|███▌      | 1765/5000 [1:00:09<1:46:25,  1.97s/it]

training loss: 1.396626591682434
training loss: 1.5324548482894897
training loss: 1.3807008266448975
training loss: 1.5188313722610474
training loss: 1.4907171726226807
training loss: 1.457284688949585


training:  35%|███▌      | 1771/5000 [1:00:21<1:46:12,  1.97s/it]

training loss: 1.4834548234939575
training loss: 1.550104022026062
training loss: 1.559624195098877
training loss: 1.5453301668167114
training loss: 1.5202528238296509
training loss: 1.512884259223938


training:  36%|███▌      | 1777/5000 [1:00:33<1:46:01,  1.97s/it]

training loss: 1.5222992897033691
training loss: 1.5855284929275513
training loss: 1.5326766967773438
training loss: 1.560378074645996
training loss: 1.4641646146774292
training loss: 1.4852700233459473


training:  36%|███▌      | 1783/5000 [1:00:45<1:45:49,  1.97s/it]

training loss: 1.4655970335006714
training loss: 1.5171576738357544
training loss: 1.3829548358917236
training loss: 1.30448579788208
training loss: 1.4922689199447632
training loss: 1.4971944093704224


training:  36%|███▌      | 1789/5000 [1:00:57<1:45:37,  1.97s/it]

training loss: 1.5979067087173462
training loss: 1.6199334859848022
training loss: 1.4903959035873413
training loss: 1.4790092706680298
training loss: 1.6179182529449463
training loss: 1.3803290128707886


training:  36%|███▌      | 1795/5000 [1:01:09<1:45:25,  1.97s/it]

training loss: 1.5186632871627808
training loss: 1.4703229665756226
training loss: 1.4788709878921509
training loss: 1.516757607460022
training loss: 1.5435150861740112
training loss: 1.6041150093078613


training:  36%|███▌      | 1795/5000 [1:01:20<1:45:25,  1.97s/it]

training loss: 1.3445103168487549


training:  36%|███▌      | 1801/5000 [1:01:21<1:45:44,  1.98s/it]

validation loss: 1.3536282777786255
training loss: 1.716864824295044
training loss: 1.440043330192566
training loss: 1.410820484161377
training loss: 1.4746437072753906
training loss: 1.4305039644241333


training:  36%|███▌      | 1807/5000 [1:01:32<1:45:23,  1.98s/it]

training loss: 1.4032397270202637
training loss: 1.4919945001602173
training loss: 1.4789607524871826
training loss: 1.524661660194397
training loss: 1.441820502281189
training loss: 1.5900832414627075


training:  36%|███▋      | 1813/5000 [1:01:44<1:45:04,  1.98s/it]

training loss: 1.5787032842636108
training loss: 1.6101047992706299
training loss: 1.4150971174240112
training loss: 1.544681191444397
training loss: 1.554835319519043
training loss: 1.5700103044509888


training:  36%|███▋      | 1819/5000 [1:01:56<1:44:48,  1.98s/it]

training loss: 1.5224946737289429
training loss: 1.541770577430725
training loss: 1.6413863897323608
training loss: 1.5111054182052612
training loss: 1.4639079570770264
training loss: 1.5727921724319458


training:  36%|███▋      | 1825/5000 [1:02:08<1:44:33,  1.98s/it]

training loss: 1.5327016115188599
training loss: 1.5680341720581055
training loss: 1.687484622001648
training loss: 1.5551587343215942
training loss: 1.582309603691101
training loss: 1.4494216442108154


training:  37%|███▋      | 1831/5000 [1:02:20<1:44:19,  1.98s/it]

training loss: 1.5472196340560913
training loss: 1.4948599338531494
training loss: 1.5429481267929077
training loss: 1.511562705039978
training loss: 1.526472568511963
training loss: 1.5604768991470337


training:  37%|███▋      | 1837/5000 [1:02:32<1:44:06,  1.97s/it]

training loss: 1.5618313550949097
training loss: 1.4174484014511108
training loss: 1.5403732061386108
training loss: 1.5895525217056274
training loss: 1.4305893182754517
training loss: 1.5220861434936523


training:  37%|███▋      | 1843/5000 [1:02:43<1:43:53,  1.97s/it]

training loss: 1.6676576137542725
training loss: 1.4723453521728516
training loss: 1.576102614402771
training loss: 1.5736663341522217
training loss: 1.471988320350647
training loss: 1.611543893814087


training:  37%|███▋      | 1849/5000 [1:02:55<1:43:41,  1.97s/it]

training loss: 1.4784196615219116
training loss: 1.497188687324524
training loss: 1.4931350946426392
training loss: 1.508975863456726
training loss: 1.4775134325027466
training loss: 1.573829174041748


training:  37%|███▋      | 1855/5000 [1:03:07<1:43:28,  1.97s/it]

training loss: 1.608956217765808
training loss: 1.5002503395080566
training loss: 1.4105833768844604
training loss: 1.4303290843963623
training loss: 1.5273405313491821
training loss: 1.4288817644119263


training:  37%|███▋      | 1861/5000 [1:03:19<1:43:16,  1.97s/it]

training loss: 1.4969722032546997
training loss: 1.4730790853500366
training loss: 1.5342397689819336
training loss: 1.536346673965454
training loss: 1.668845534324646
training loss: 1.567256212234497


training:  37%|███▋      | 1867/5000 [1:03:31<1:43:03,  1.97s/it]

training loss: 1.5876754522323608
training loss: 1.4406636953353882
training loss: 1.4696685075759888
training loss: 1.5713341236114502
training loss: 1.3298711776733398
training loss: 1.5627281665802002


training:  37%|███▋      | 1873/5000 [1:03:43<1:42:51,  1.97s/it]

training loss: 1.3868845701217651
training loss: 1.4426010847091675
training loss: 1.4989819526672363
training loss: 1.4453343152999878
training loss: 1.701529860496521
training loss: 1.5374040603637695


training:  38%|███▊      | 1879/5000 [1:03:54<1:42:39,  1.97s/it]

training loss: 1.4950066804885864
training loss: 1.4754267930984497
training loss: 1.3171356916427612
training loss: 1.3475648164749146
training loss: 1.4284840822219849
training loss: 1.5639721155166626


training:  38%|███▊      | 1885/5000 [1:04:06<1:42:28,  1.97s/it]

training loss: 1.5898064374923706
training loss: 1.4687169790267944
training loss: 1.484801173210144
training loss: 1.4439440965652466
training loss: 1.6234756708145142
training loss: 1.4983857870101929


training:  38%|███▊      | 1891/5000 [1:04:18<1:42:16,  1.97s/it]

training loss: 1.2806519269943237
training loss: 1.502994179725647
training loss: 1.4519985914230347
training loss: 1.407739520072937
training loss: 1.5590797662734985
training loss: 1.5551034212112427


training:  38%|███▊      | 1897/5000 [1:04:30<1:42:04,  1.97s/it]

training loss: 1.3800289630889893
training loss: 1.4498536586761475
training loss: 1.5498725175857544
training loss: 1.4574061632156372
training loss: 1.5292085409164429
validation loss: 1.4593218564987183
training loss: 1.6514254808425903


training:  38%|███▊      | 1903/5000 [1:04:42<1:42:22,  1.98s/it]

training loss: 1.5732004642486572
training loss: 1.5822398662567139
training loss: 1.315652847290039
training loss: 1.4835655689239502
training loss: 1.6302958726882935
training loss: 1.5600007772445679


training:  38%|███▊      | 1909/5000 [1:04:54<1:42:02,  1.98s/it]

training loss: 1.5460163354873657
training loss: 1.3889285326004028
training loss: 1.6154855489730835
training loss: 1.5930204391479492
training loss: 1.5378092527389526
training loss: 1.496157169342041


training:  38%|███▊      | 1915/5000 [1:05:06<1:41:44,  1.98s/it]

training loss: 1.3875027894973755
training loss: 1.5010818243026733
training loss: 1.4240185022354126
training loss: 1.5324922800064087
training loss: 1.5025182962417603
training loss: 1.5920393466949463


training:  38%|███▊      | 1921/5000 [1:05:18<1:41:27,  1.98s/it]

training loss: 1.5339890718460083
training loss: 1.478461503982544
training loss: 1.5551080703735352
training loss: 1.5745410919189453
training loss: 1.4651769399642944
training loss: 1.5644954442977905


training:  39%|███▊      | 1927/5000 [1:05:29<1:41:12,  1.98s/it]

training loss: 1.501326322555542
training loss: 1.4789432287216187
training loss: 1.3578858375549316
training loss: 1.5220638513565063
training loss: 1.551393747329712
training loss: 1.4825280904769897


training:  39%|███▊      | 1933/5000 [1:05:41<1:40:57,  1.98s/it]

training loss: 1.635907530784607
training loss: 1.3389246463775635
training loss: 1.4494097232818604
training loss: 1.4686617851257324
training loss: 1.4775692224502563
training loss: 1.4170441627502441


training:  39%|███▉      | 1939/5000 [1:05:53<1:40:44,  1.97s/it]

training loss: 1.541839838027954
training loss: 1.4987821578979492
training loss: 1.4738831520080566
training loss: 1.492455005645752
training loss: 1.6177343130111694
training loss: 1.479210376739502


training:  39%|███▉      | 1945/5000 [1:06:05<1:40:32,  1.97s/it]

training loss: 1.3400452136993408
training loss: 1.4295850992202759
training loss: 1.4742380380630493
training loss: 1.4992176294326782
training loss: 1.5360403060913086
training loss: 1.6215587854385376


training:  39%|███▉      | 1951/5000 [1:06:17<1:40:20,  1.97s/it]

training loss: 1.6247013807296753
training loss: 1.5275505781173706
training loss: 1.5022624731063843
training loss: 1.5858211517333984
training loss: 1.5493168830871582
training loss: 1.5247712135314941


training:  39%|███▉      | 1957/5000 [1:06:29<1:40:07,  1.97s/it]

training loss: 1.4840983152389526
training loss: 1.524718165397644
training loss: 1.6327952146530151
training loss: 1.3882198333740234
training loss: 1.6145431995391846
training loss: 1.4959025382995605


training:  39%|███▉      | 1963/5000 [1:06:40<1:39:55,  1.97s/it]

training loss: 1.4609109163284302
training loss: 1.590741515159607
training loss: 1.5207679271697998
training loss: 1.3316890001296997
training loss: 1.6640808582305908
training loss: 1.3327604532241821


training:  39%|███▉      | 1969/5000 [1:06:52<1:39:44,  1.97s/it]

training loss: 1.7220134735107422
training loss: 1.6215999126434326
training loss: 1.538110613822937
training loss: 1.4734036922454834
training loss: 1.5032284259796143
training loss: 1.5906509160995483


training:  40%|███▉      | 1975/5000 [1:07:04<1:39:32,  1.97s/it]

training loss: 1.273726463317871
training loss: 1.397803783416748
training loss: 1.5071731805801392
training loss: 1.4540834426879883
training loss: 1.3607391119003296
training loss: 1.519705057144165


training:  40%|███▉      | 1981/5000 [1:07:16<1:39:19,  1.97s/it]

training loss: 1.5286469459533691
training loss: 1.5068566799163818
training loss: 1.4289836883544922
training loss: 1.4408526420593262
training loss: 1.580629587173462
training loss: 1.5484720468521118


training:  40%|███▉      | 1987/5000 [1:07:28<1:39:07,  1.97s/it]

training loss: 1.6738147735595703
training loss: 1.568284273147583
training loss: 1.3083029985427856
training loss: 1.434907078742981
training loss: 1.3094805479049683
training loss: 1.6489044427871704


training:  40%|███▉      | 1993/5000 [1:07:40<1:38:55,  1.97s/it]

training loss: 1.4414606094360352
training loss: 1.48826003074646
training loss: 1.316872239112854
training loss: 1.453162431716919
training loss: 1.5678694248199463
training loss: 1.4622596502304077


training:  40%|███▉      | 1999/5000 [1:07:52<1:38:44,  1.97s/it]

training loss: 1.4162427186965942
training loss: 1.4675476551055908
training loss: 1.4998104572296143
validation loss: 1.4460338354110718
%s 

 %s ("645]] he began building [[Imogiri]], his burial place, about fifteen kilometers south of Yogyakarta.  Imogiri remains the resting place of most of the royalty of Yogyakarta and Surakarta to this day. Agung died in the spring of [[1646]], with his image of royal invincibility shattered by his losses to the Dutch, but he did leave behind an empire that covered most of Java and stretched to its neighboring islands.  Upon taking the throne, Agung's son Susuhunan [[Amangkurat I of Mataram|Amangkurat I]] tried to bring long-term stability to Mataram's realm, murdering local leaders that were insufficiently deferential to him, and closing ports so he alone had control over trade with the Dutch.  By the mid-1670s dissatisfaction with the king fanned into open revolt, beginning at the margins and creeping inward. [[Raden Trunajaya]], a prince from 

training:  40%|████      | 2001/5000 [1:08:26<3:13:42,  3.88s/it]

a Aldes The Germark Aest]] [[Intellies]] [[Chopolar Fay I]] the [[George Bon The China]], [[Neta|Linie Derol Chaplors]] show in first also ave growth a tect the recent of propert, save marked inviewed by scall lookane.  In fieloque of the Emption with [[Hind JosÃ¼n Cape Worlogica]]s well the perfrecise of the near lyries and its science '''Theory overs'' and ''Tem writted Mangaria. Eventured by [[Shard of Irance-took Antical Empany]]''  Bellore Roman speassed as the [[The Ada (migh of Heavail]], white time,
training loss: 1.5039348602294922
training loss: 1.4466166496276855
training loss: 1.4755803346633911
training loss: 1.5725831985473633
training loss: 1.4435653686523438


training:  40%|████      | 2007/5000 [1:08:38<2:40:14,  3.21s/it]

training loss: 1.6401972770690918
training loss: 1.601177453994751
training loss: 1.3196382522583008
training loss: 1.5547012090682983
training loss: 1.4519506692886353
training loss: 1.453761100769043


training:  40%|████      | 2013/5000 [1:08:50<2:19:24,  2.80s/it]

training loss: 1.4385008811950684
training loss: 1.5292412042617798
training loss: 1.494844913482666
training loss: 1.6057734489440918
training loss: 1.4774582386016846
training loss: 1.4795212745666504


training:  40%|████      | 2019/5000 [1:09:01<2:05:54,  2.53s/it]

training loss: 1.4806749820709229
training loss: 1.3501685857772827
training loss: 1.48379647731781
training loss: 1.5345699787139893
training loss: 1.519500732421875
training loss: 1.425381064414978


training:  40%|████      | 2025/5000 [1:09:13<1:56:54,  2.36s/it]

training loss: 1.5568437576293945
training loss: 1.5135245323181152
training loss: 1.478757381439209
training loss: 1.4592187404632568
training loss: 1.548209547996521
training loss: 1.4681408405303955


training:  41%|████      | 2031/5000 [1:09:25<1:50:45,  2.24s/it]

training loss: 1.5850164890289307
training loss: 1.5738308429718018
training loss: 1.4658582210540771
training loss: 1.4283499717712402
training loss: 1.4091711044311523
training loss: 1.4574735164642334


training:  41%|████      | 2037/5000 [1:09:37<1:46:31,  2.16s/it]

training loss: 1.5961482524871826
training loss: 1.449048399925232
training loss: 1.6754775047302246
training loss: 1.4869686365127563
training loss: 1.5214087963104248
training loss: 1.464970588684082


training:  41%|████      | 2043/5000 [1:09:49<1:43:33,  2.10s/it]

training loss: 1.5170466899871826
training loss: 1.481187105178833
training loss: 1.526193380355835
training loss: 1.566213607788086
training loss: 1.4671162366867065
training loss: 1.5461342334747314


training:  41%|████      | 2049/5000 [1:10:01<1:41:26,  2.06s/it]

training loss: 1.3692853450775146
training loss: 1.5099111795425415
training loss: 1.531447410583496
training loss: 1.5621528625488281
training loss: 1.3479312658309937
training loss: 1.4428826570510864


training:  41%|████      | 2055/5000 [1:10:13<1:39:55,  2.04s/it]

training loss: 1.429282307624817
training loss: 1.5086331367492676
training loss: 1.66289484500885
training loss: 1.5102990865707397
training loss: 1.5130581855773926
training loss: 1.4734523296356201


training:  41%|████      | 2061/5000 [1:10:24<1:38:48,  2.02s/it]

training loss: 1.3303844928741455
training loss: 1.5081251859664917
training loss: 1.5090131759643555
training loss: 1.4613040685653687
training loss: 1.4965152740478516
training loss: 1.4114211797714233


training:  41%|████▏     | 2067/5000 [1:10:36<1:37:58,  2.00s/it]

training loss: 1.517461895942688
training loss: 1.4613467454910278
training loss: 1.5424830913543701
training loss: 1.3426923751831055
training loss: 1.4724212884902954
training loss: 1.53252375125885


training:  41%|████▏     | 2073/5000 [1:10:48<1:37:20,  2.00s/it]

training loss: 1.5733979940414429
training loss: 1.4379539489746094
training loss: 1.5155962705612183
training loss: 1.4764463901519775
training loss: 1.306256651878357
training loss: 1.4548053741455078


training:  42%|████▏     | 2079/5000 [1:11:00<1:36:50,  1.99s/it]

training loss: 1.4771955013275146
training loss: 1.5045150518417358
training loss: 1.3442649841308594
training loss: 1.5275756120681763
training loss: 1.5144364833831787
training loss: 1.4693121910095215


training:  42%|████▏     | 2085/5000 [1:11:12<1:36:25,  1.98s/it]

training loss: 1.535660982131958
training loss: 1.6202034950256348
training loss: 1.7531592845916748
training loss: 1.3779820203781128
training loss: 1.361689567565918
training loss: 1.5149593353271484


training:  42%|████▏     | 2091/5000 [1:11:24<1:36:04,  1.98s/it]

training loss: 1.6286112070083618
training loss: 1.5081226825714111
training loss: 1.5763421058654785
training loss: 1.4109077453613281
training loss: 1.3115129470825195
training loss: 1.5769050121307373


training:  42%|████▏     | 2097/5000 [1:11:35<1:35:46,  1.98s/it]

training loss: 1.4490909576416016
training loss: 1.5235836505889893
training loss: 1.4813265800476074
training loss: 1.4300687313079834
training loss: 1.4301873445510864
validation loss: 1.3475925922393799
training loss: 1.4999175071716309


training:  42%|████▏     | 2103/5000 [1:11:47<1:35:57,  1.99s/it]

training loss: 1.7014261484146118
training loss: 1.3968956470489502
training loss: 1.495495319366455
training loss: 1.508741021156311
training loss: 1.4474291801452637
training loss: 1.422309398651123


training:  42%|████▏     | 2109/5000 [1:11:59<1:35:34,  1.98s/it]

training loss: 1.1104099750518799
training loss: 1.4840413331985474
training loss: 1.4545977115631104
training loss: 1.6164413690567017
training loss: 1.4432379007339478
training loss: 1.4709385633468628


training:  42%|████▏     | 2115/5000 [1:12:11<1:35:14,  1.98s/it]

training loss: 1.5261831283569336
training loss: 1.6499305963516235
training loss: 1.4348639249801636
training loss: 1.4075469970703125
training loss: 1.4672850370407104
training loss: 1.4539344310760498


training:  42%|████▏     | 2121/5000 [1:12:23<1:34:56,  1.98s/it]

training loss: 1.467142105102539
training loss: 1.5191620588302612
training loss: 1.4826064109802246
training loss: 1.5294740200042725
training loss: 1.3814594745635986
training loss: 1.5239863395690918


training:  43%|████▎     | 2127/5000 [1:12:35<1:34:40,  1.98s/it]

training loss: 1.4957531690597534
training loss: 1.5426032543182373
training loss: 1.4575568437576294
training loss: 1.4793592691421509
training loss: 1.3121531009674072
training loss: 1.6792564392089844


training:  43%|████▎     | 2133/5000 [1:12:47<1:34:25,  1.98s/it]

training loss: 1.568219542503357
training loss: 1.4881439208984375
training loss: 1.4245274066925049
training loss: 1.4911702871322632
training loss: 1.4964112043380737
training loss: 1.4909141063690186


training:  43%|████▎     | 2139/5000 [1:12:59<1:34:11,  1.98s/it]

training loss: 1.6275207996368408
training loss: 1.4782987833023071
training loss: 1.4326516389846802
training loss: 1.5913435220718384
training loss: 1.465319037437439
training loss: 1.6329702138900757


training:  43%|████▎     | 2145/5000 [1:13:10<1:33:58,  1.97s/it]

training loss: 1.3717154264450073
training loss: 1.451269507408142
training loss: 1.5215888023376465
training loss: 1.4266269207000732
training loss: 1.4462876319885254
training loss: 1.3608241081237793


training:  43%|████▎     | 2151/5000 [1:13:22<1:33:45,  1.97s/it]

training loss: 1.4485090970993042
training loss: 1.5098307132720947
training loss: 1.5447224378585815
training loss: 1.4839279651641846
training loss: 1.515336513519287
training loss: 1.5107868909835815


training:  43%|████▎     | 2157/5000 [1:13:34<1:33:32,  1.97s/it]

training loss: 1.492142915725708
training loss: 1.5682605504989624
training loss: 1.2354097366333008
training loss: 1.4610358476638794
training loss: 1.5322530269622803
training loss: 1.5224558115005493


training:  43%|████▎     | 2163/5000 [1:13:46<1:33:20,  1.97s/it]

training loss: 1.466664433479309
training loss: 1.490970492362976
training loss: 1.4129737615585327
training loss: 1.481513261795044
training loss: 1.3647198677062988
training loss: 1.55741286277771


training:  43%|████▎     | 2169/5000 [1:13:58<1:33:08,  1.97s/it]

training loss: 1.5227314233779907
training loss: 1.2718018293380737
training loss: 1.4790282249450684
training loss: 1.5437546968460083
training loss: 1.5750516653060913
training loss: 1.1361782550811768


training:  44%|████▎     | 2175/5000 [1:14:10<1:32:56,  1.97s/it]

training loss: 1.547982096672058
training loss: 1.4107939004898071
training loss: 1.5078256130218506
training loss: 1.6067438125610352
training loss: 1.385162115097046
training loss: 1.4890717267990112


training:  44%|████▎     | 2181/5000 [1:14:21<1:32:44,  1.97s/it]

training loss: 1.4932752847671509
training loss: 1.582729458808899
training loss: 1.6011956930160522
training loss: 1.4540406465530396
training loss: 1.5075715780258179
training loss: 1.505144476890564


training:  44%|████▎     | 2187/5000 [1:14:33<1:32:32,  1.97s/it]

training loss: 1.4689435958862305
training loss: 1.452980637550354
training loss: 1.3785814046859741
training loss: 1.2832083702087402
training loss: 1.5513120889663696
training loss: 1.4949089288711548


training:  44%|████▍     | 2193/5000 [1:14:45<1:32:20,  1.97s/it]

training loss: 1.4448703527450562
training loss: 1.3783987760543823
training loss: 1.3876864910125732
training loss: 1.4502184391021729
training loss: 1.5197663307189941
training loss: 1.5707610845565796


training:  44%|████▍     | 2199/5000 [1:14:57<1:32:09,  1.97s/it]

training loss: 1.502610206604004
training loss: 1.4582339525222778
training loss: 1.6009520292282104
validation loss: 1.4297740459442139
training loss: 1.4442392587661743
training loss: 1.464129090309143
training loss: 1.104950189590454


training:  44%|████▍     | 2205/5000 [1:15:09<1:32:24,  1.98s/it]

training loss: 1.4296270608901978
training loss: 1.0498048067092896
training loss: 1.6978373527526855
training loss: 1.5373574495315552
training loss: 1.4955319166183472
training loss: 1.5977555513381958


training:  44%|████▍     | 2211/5000 [1:15:21<1:32:04,  1.98s/it]

training loss: 1.4780176877975464
training loss: 1.5850731134414673
training loss: 1.4781122207641602
training loss: 1.5578396320343018
training loss: 1.5139776468276978
training loss: 1.3938556909561157


training:  44%|████▍     | 2217/5000 [1:15:33<1:31:47,  1.98s/it]

training loss: 1.545912265777588
training loss: 1.590360403060913
training loss: 1.3700056076049805
training loss: 1.4226950407028198
training loss: 1.3833619356155396
training loss: 1.538358449935913


training:  44%|████▍     | 2223/5000 [1:15:45<1:31:31,  1.98s/it]

training loss: 1.4600483179092407
training loss: 1.431481957435608
training loss: 1.32584547996521
training loss: 1.4340628385543823
training loss: 1.434656023979187
training loss: 1.469470739364624


training:  45%|████▍     | 2229/5000 [1:15:56<1:31:16,  1.98s/it]

training loss: 1.37169349193573
training loss: 1.496761679649353
training loss: 1.4007840156555176
training loss: 1.4388320446014404
training loss: 1.3917624950408936
training loss: 1.4964476823806763


training:  45%|████▍     | 2235/5000 [1:16:08<1:31:02,  1.98s/it]

training loss: 1.5996628999710083
training loss: 1.5079609155654907
training loss: 1.5505785942077637
training loss: 1.6431362628936768
training loss: 1.4038935899734497
training loss: 1.5362333059310913


training:  45%|████▍     | 2241/5000 [1:16:20<1:30:49,  1.98s/it]

training loss: 1.4743911027908325
training loss: 1.5123202800750732
training loss: 1.4904130697250366
training loss: 1.5616673231124878
training loss: 1.5399361848831177
training loss: 1.4524000883102417


training:  45%|████▍     | 2247/5000 [1:16:32<1:30:36,  1.97s/it]

training loss: 1.5827856063842773
training loss: 1.5491749048233032
training loss: 1.4740791320800781
training loss: 1.5001680850982666
training loss: 1.5859718322753906
training loss: 1.4349907636642456


training:  45%|████▌     | 2253/5000 [1:16:44<1:30:24,  1.97s/it]

training loss: 1.4090029001235962
training loss: 1.5416086912155151
training loss: 1.5453368425369263
training loss: 1.5606368780136108
training loss: 1.5836350917816162
training loss: 1.4881421327590942


training:  45%|████▌     | 2259/5000 [1:16:56<1:30:12,  1.97s/it]

training loss: 1.4164471626281738
training loss: 1.434436321258545
training loss: 1.3670555353164673
training loss: 1.4829177856445312
training loss: 1.4887950420379639
training loss: 1.5589414834976196


training:  45%|████▌     | 2265/5000 [1:17:07<1:30:00,  1.97s/it]

training loss: 1.453522801399231
training loss: 1.3720821142196655
training loss: 1.5821293592453003
training loss: 1.551682472229004
training loss: 1.4603623151779175
training loss: 1.5023528337478638


training:  45%|████▌     | 2271/5000 [1:17:19<1:29:48,  1.97s/it]

training loss: 1.5786222219467163
training loss: 1.311539649963379
training loss: 1.449742317199707
training loss: 1.362065076828003
training loss: 1.3575999736785889
training loss: 1.4922062158584595


training:  46%|████▌     | 2277/5000 [1:17:31<1:29:36,  1.97s/it]

training loss: 1.5234062671661377
training loss: 1.448266863822937
training loss: 1.5955722332000732
training loss: 1.479888916015625
training loss: 1.4265832901000977
training loss: 1.4114454984664917


training:  46%|████▌     | 2283/5000 [1:17:43<1:29:24,  1.97s/it]

training loss: 1.4702788591384888
training loss: 1.3849656581878662
training loss: 1.4427794218063354
training loss: 1.4892200231552124
training loss: 1.5225015878677368
training loss: 1.5701465606689453


training:  46%|████▌     | 2289/5000 [1:17:55<1:29:12,  1.97s/it]

training loss: 1.3917216062545776
training loss: 1.4524422883987427
training loss: 1.4535472393035889
training loss: 1.5841649770736694
training loss: 1.1928799152374268
training loss: 1.5104057788848877


training:  46%|████▌     | 2295/5000 [1:18:07<1:28:59,  1.97s/it]

training loss: 1.4085605144500732
training loss: 1.4424883127212524
training loss: 1.3944758176803589
training loss: 1.5116002559661865
training loss: 1.4411293268203735
training loss: 1.1395375728607178
training loss: 1.420902132987976


training:  46%|████▌     | 2301/5000 [1:18:19<1:29:14,  1.98s/it]

validation loss: 1.4113925695419312
training loss: 1.4964250326156616
training loss: 1.3843914270401
training loss: 1.3950762748718262
training loss: 1.4872671365737915
training loss: 1.4013561010360718


training:  46%|████▌     | 2307/5000 [1:18:31<1:28:54,  1.98s/it]

training loss: 1.5808643102645874
training loss: 1.5200060606002808
training loss: 1.4390649795532227
training loss: 1.5188202857971191
training loss: 1.3367611169815063
training loss: 1.507819652557373


training:  46%|████▋     | 2313/5000 [1:18:42<1:28:36,  1.98s/it]

training loss: 1.6311488151550293
training loss: 1.4781478643417358
training loss: 1.4900683164596558
training loss: 1.5080465078353882
training loss: 1.5446583032608032
training loss: 1.3573875427246094


training:  46%|████▋     | 2319/5000 [1:18:54<1:28:21,  1.98s/it]

training loss: 1.574008822441101
training loss: 1.423016905784607
training loss: 1.5542232990264893
training loss: 1.5374281406402588
training loss: 1.5667998790740967
training loss: 1.3592697381973267


training:  46%|████▋     | 2325/5000 [1:19:06<1:28:06,  1.98s/it]

training loss: 1.5452841520309448
training loss: 1.5337411165237427
training loss: 1.570312738418579
training loss: 1.5251468420028687
training loss: 1.5050863027572632
training loss: 1.4406137466430664


training:  47%|████▋     | 2331/5000 [1:19:18<1:27:52,  1.98s/it]

training loss: 1.3023337125778198
training loss: 1.3829425573349
training loss: 1.611348271369934
training loss: 1.4705562591552734
training loss: 1.5138517618179321
training loss: 1.5385643243789673


training:  47%|████▋     | 2337/5000 [1:19:30<1:27:38,  1.97s/it]

training loss: 1.519639492034912
training loss: 1.5362434387207031
training loss: 1.5088564157485962
training loss: 1.4948956966400146
training loss: 1.3572583198547363
training loss: 1.6518585681915283


training:  47%|████▋     | 2343/5000 [1:19:42<1:27:26,  1.97s/it]

training loss: 1.54188072681427
training loss: 1.4991363286972046
training loss: 1.43012273311615
training loss: 1.4522992372512817
training loss: 1.6110782623291016
training loss: 1.2975289821624756


training:  47%|████▋     | 2349/5000 [1:19:53<1:27:14,  1.97s/it]

training loss: 1.5938270092010498
training loss: 1.4312821626663208
training loss: 1.5129860639572144
training loss: 1.5059934854507446
training loss: 1.3966273069381714
training loss: 1.6138120889663696


training:  47%|████▋     | 2355/5000 [1:20:05<1:27:01,  1.97s/it]

training loss: 1.3586698770523071
training loss: 1.4823286533355713
training loss: 1.6970815658569336
training loss: 1.5186095237731934
training loss: 1.4960825443267822
training loss: 1.5000892877578735


training:  47%|████▋     | 2361/5000 [1:20:17<1:26:49,  1.97s/it]

training loss: 1.4280873537063599
training loss: 1.4937750101089478
training loss: 1.4548616409301758
training loss: 1.3112345933914185
training loss: 1.4673659801483154
training loss: 1.5364089012145996


training:  47%|████▋     | 2367/5000 [1:20:29<1:26:37,  1.97s/it]

training loss: 1.4224082231521606
training loss: 1.52135169506073
training loss: 1.586904525756836
training loss: 1.614850640296936
training loss: 1.464375376701355
training loss: 1.4884945154190063


training:  47%|████▋     | 2373/5000 [1:20:41<1:26:26,  1.97s/it]

training loss: 1.476321816444397
training loss: 1.3214821815490723
training loss: 1.4575172662734985
training loss: 1.4554252624511719
training loss: 1.4631333351135254
training loss: 1.4494651556015015


training:  48%|████▊     | 2379/5000 [1:20:53<1:26:13,  1.97s/it]

training loss: 1.3709290027618408
training loss: 1.4717276096343994
training loss: 1.4897176027297974
training loss: 1.397987961769104
training loss: 1.561790943145752
training loss: 1.3634189367294312


training:  48%|████▊     | 2385/5000 [1:21:05<1:26:01,  1.97s/it]

training loss: 1.400962233543396
training loss: 1.4524236917495728
training loss: 1.4325730800628662
training loss: 1.5832629203796387
training loss: 1.4355380535125732
training loss: 1.4999407529830933


training:  48%|████▊     | 2391/5000 [1:21:16<1:25:50,  1.97s/it]

training loss: 1.3997893333435059
training loss: 1.4153000116348267
training loss: 1.3645703792572021
training loss: 1.4864288568496704
training loss: 1.5480163097381592
training loss: 1.5054142475128174


training:  48%|████▊     | 2397/5000 [1:21:28<1:25:38,  1.97s/it]

training loss: 1.393418788909912
training loss: 1.4602296352386475
training loss: 1.5171171426773071
training loss: 1.6022528409957886
training loss: 1.6039952039718628
validation loss: 1.4400657415390015
training loss: 1.4068018198013306


training:  48%|████▊     | 2403/5000 [1:21:40<1:25:52,  1.98s/it]

training loss: 1.4583525657653809
training loss: 1.4003838300704956
training loss: 1.3806527853012085
training loss: 1.443398118019104
training loss: 1.458499550819397
training loss: 1.5207079648971558


training:  48%|████▊     | 2409/5000 [1:21:52<1:25:32,  1.98s/it]

training loss: 1.4926217794418335
training loss: 1.4821995496749878
training loss: 1.524922251701355
training loss: 1.4760712385177612
training loss: 1.390710711479187
training loss: 1.425916075706482


training:  48%|████▊     | 2415/5000 [1:22:04<1:25:15,  1.98s/it]

training loss: 1.3962746858596802
training loss: 1.3792188167572021
training loss: 1.4668831825256348
training loss: 1.5160837173461914
training loss: 1.480962872505188
training loss: 1.4954934120178223


training:  48%|████▊     | 2421/5000 [1:22:16<1:25:00,  1.98s/it]

training loss: 1.5213476419448853
training loss: 1.5006370544433594
training loss: 1.5067766904830933
training loss: 1.5151244401931763
training loss: 1.4881136417388916
training loss: 1.5184592008590698


training:  49%|████▊     | 2427/5000 [1:22:28<1:24:45,  1.98s/it]

training loss: 1.3998000621795654
training loss: 1.3880025148391724
training loss: 1.4722272157669067
training loss: 1.4645578861236572
training loss: 1.4453388452529907
training loss: 1.5272578001022339


training:  49%|████▊     | 2433/5000 [1:22:39<1:24:31,  1.98s/it]

training loss: 1.3901305198669434
training loss: 1.3930617570877075
training loss: 1.4912856817245483
training loss: 1.4860739707946777
training loss: 1.5564329624176025
training loss: 1.4259284734725952


training:  49%|████▉     | 2439/5000 [1:22:51<1:24:18,  1.98s/it]

training loss: 1.4523907899856567
training loss: 1.463611364364624
training loss: 1.3928449153900146
training loss: 1.574324131011963
training loss: 1.4591643810272217
training loss: 1.3042166233062744


training:  49%|████▉     | 2445/5000 [1:23:03<1:24:04,  1.97s/it]

training loss: 1.5648009777069092
training loss: 1.429388403892517
training loss: 1.5241044759750366
training loss: 1.5389002561569214
training loss: 1.4755939245224
training loss: 1.5177655220031738


training:  49%|████▉     | 2451/5000 [1:23:15<1:23:52,  1.97s/it]

training loss: 1.5474107265472412
training loss: 1.4395835399627686
training loss: 1.4885929822921753
training loss: 1.4569458961486816
training loss: 1.6389286518096924
training loss: 1.5230343341827393


training:  49%|████▉     | 2457/5000 [1:23:27<1:23:40,  1.97s/it]

training loss: 1.511275053024292
training loss: 1.3816393613815308
training loss: 1.5437973737716675
training loss: 1.5529630184173584
training loss: 1.5296440124511719
training loss: 1.4419069290161133


training:  49%|████▉     | 2463/5000 [1:23:39<1:23:28,  1.97s/it]

training loss: 1.5569013357162476
training loss: 1.4175387620925903
training loss: 1.4630577564239502
training loss: 1.310253620147705
training loss: 1.4302693605422974
training loss: 1.3716628551483154


training:  49%|████▉     | 2469/5000 [1:23:51<1:23:16,  1.97s/it]

training loss: 1.4591325521469116
training loss: 1.5251295566558838
training loss: 1.618332862854004
training loss: 1.4637573957443237
training loss: 1.413881540298462
training loss: 1.5295159816741943


training:  50%|████▉     | 2475/5000 [1:24:02<1:23:04,  1.97s/it]

training loss: 1.4725360870361328
training loss: 1.592060923576355
training loss: 1.5240525007247925
training loss: 1.4783356189727783
training loss: 1.638056755065918
training loss: 1.4668328762054443


training:  50%|████▉     | 2481/5000 [1:24:14<1:22:52,  1.97s/it]

training loss: 1.5748533010482788
training loss: 1.4890987873077393
training loss: 1.5562396049499512
training loss: 1.4392669200897217
training loss: 1.4450868368148804
training loss: 1.4433006048202515


training:  50%|████▉     | 2487/5000 [1:24:26<1:22:40,  1.97s/it]

training loss: 1.615090012550354
training loss: 1.4791686534881592
training loss: 1.5248620510101318
training loss: 1.4757966995239258
training loss: 1.5109367370605469
training loss: 1.4125174283981323


training:  50%|████▉     | 2493/5000 [1:24:38<1:22:28,  1.97s/it]

training loss: 1.4464439153671265
training loss: 1.5197207927703857
training loss: 1.4113876819610596
training loss: 1.4292123317718506
training loss: 1.4531874656677246
training loss: 1.375632405281067


training:  50%|████▉     | 2499/5000 [1:24:50<1:22:16,  1.97s/it]

training loss: 1.4488717317581177
training loss: 1.5116190910339355
training loss: 1.4344888925552368
validation loss: 1.3360271453857422
%s 

 %s ("ions he needed and while he could not resort to open torture, whatever means he did use must have been fearsome because Newton himself later ordered all records of these interrogations to be destroyed. However he did it, Newton won his convictions and in February 1699, he had ten prisoners waiting to be executed.  Newton's greatest triumph as the king's attorney was against [[William Chaloner]]. Chaloner was a rogue with a devious intelligence. He set up phoney conspiracies of Catholics and then turned in the hapless conspirators whom he entrapped. Chaloner made himself rich enough to posture as a gentleman. Petitioning [[Parliament of England|Parliament]], Chaloner accused the Mint of providing tools to counterfeiters. (This charge was made also by others.) He proposed that he be allowed to inspect the Mint's processes in order to improve

training:  50%|█████     | 2501/5000 [1:25:24<2:41:22,  3.87s/it]

 power clogress ''Scroussexual City Poloral Brall advic Dephine'', ectionaing messenche, allocian meric singlish style interest work producations, the [[Alexac Hahing Represerving of Lanticle Casular Malans Paddition]]. # The gave [[Laname Coleche]], ands of [[Gobsounds]]. The sancism chailors of publishment [[commusion]], as ame in [[Brofestantion]], other and two to at Dention's mave that many rediations at the [[moded Sideric progration|Clling]] pauly [[Miscitypervity]]. In interestate, a book and musion
training loss: 1.5274105072021484
training loss: 1.4186439514160156
training loss: 1.4976403713226318
training loss: 1.4573097229003906
training loss: 1.5500776767730713


training:  50%|█████     | 2507/5000 [1:25:36<2:13:26,  3.21s/it]

training loss: 1.367200493812561
training loss: 1.4611049890518188
training loss: 1.4455716609954834
training loss: 1.3743999004364014
training loss: 1.3386892080307007
training loss: 1.3506529331207275


training:  50%|█████     | 2513/5000 [1:25:48<1:56:03,  2.80s/it]

training loss: 1.5534491539001465
training loss: 1.4996836185455322
training loss: 1.495040774345398
training loss: 1.3229445219039917
training loss: 1.509427547454834
training loss: 1.4497098922729492


training:  50%|█████     | 2519/5000 [1:26:00<1:44:46,  2.53s/it]

training loss: 1.5071412324905396
training loss: 1.4704558849334717
training loss: 1.5138578414916992
training loss: 1.4701573848724365
training loss: 1.5453656911849976
training loss: 1.5910794734954834


training:  50%|█████     | 2525/5000 [1:26:11<1:37:14,  2.36s/it]

training loss: 1.3850725889205933
training loss: 1.5422254800796509
training loss: 1.5067830085754395
training loss: 1.4456076622009277
training loss: 1.4239284992218018
training loss: 1.474172592163086


training:  51%|█████     | 2531/5000 [1:26:23<1:32:06,  2.24s/it]

training loss: 1.4744813442230225
training loss: 1.4508769512176514
training loss: 1.4415595531463623
training loss: 1.3849575519561768
training loss: 1.3606880903244019
training loss: 1.3952157497406006


training:  51%|█████     | 2537/5000 [1:26:35<1:28:32,  2.16s/it]

training loss: 1.4004689455032349
training loss: 1.3493802547454834
training loss: 1.6067720651626587
training loss: 1.450308084487915
training loss: 1.4411823749542236
training loss: 1.462376356124878


training:  51%|█████     | 2543/5000 [1:26:47<1:26:02,  2.10s/it]

training loss: 1.380367398262024
training loss: 1.6811330318450928
training loss: 1.6178863048553467
training loss: 1.4283390045166016
training loss: 1.4642523527145386
training loss: 1.406484842300415


training:  51%|█████     | 2549/5000 [1:26:59<1:24:15,  2.06s/it]

training loss: 1.5224775075912476
training loss: 1.5051193237304688
training loss: 1.4451375007629395
training loss: 1.5101481676101685
training loss: 1.3654910326004028
training loss: 1.4283180236816406


training:  51%|█████     | 2555/5000 [1:27:11<1:22:57,  2.04s/it]

training loss: 1.3654963970184326
training loss: 1.51004159450531
training loss: 1.4513298273086548
training loss: 1.3901221752166748
training loss: 1.5391881465911865
training loss: 1.4687719345092773


training:  51%|█████     | 2561/5000 [1:27:23<1:21:58,  2.02s/it]

training loss: 1.3366835117340088
training loss: 1.5144305229187012
training loss: 1.454336166381836
training loss: 1.4602642059326172
training loss: 1.6042946577072144
training loss: 1.4813721179962158


training:  51%|█████▏    | 2567/5000 [1:27:34<1:21:14,  2.00s/it]

training loss: 1.4895073175430298
training loss: 1.5736160278320312
training loss: 1.5038435459136963
training loss: 1.5236797332763672
training loss: 1.6492308378219604
training loss: 1.4121348857879639


training:  51%|█████▏    | 2573/5000 [1:27:46<1:20:40,  1.99s/it]

training loss: 1.441127061843872
training loss: 1.633342981338501
training loss: 1.4390132427215576
training loss: 1.411159634590149
training loss: 1.439659595489502
training loss: 1.572246789932251


training:  52%|█████▏    | 2579/5000 [1:27:58<1:20:13,  1.99s/it]

training loss: 1.4082229137420654
training loss: 1.4021708965301514
training loss: 1.7389404773712158
training loss: 1.4702954292297363
training loss: 1.5183342695236206
training loss: 1.4427638053894043


training:  52%|█████▏    | 2585/5000 [1:28:10<1:19:51,  1.98s/it]

training loss: 1.4668574333190918
training loss: 1.3932582139968872
training loss: 1.4466314315795898
training loss: 1.5022547245025635
training loss: 1.358510971069336
training loss: 1.4100556373596191


training:  52%|█████▏    | 2591/5000 [1:28:22<1:19:31,  1.98s/it]

training loss: 1.4922749996185303
training loss: 1.4572982788085938
training loss: 1.5110998153686523
training loss: 1.397215485572815
training loss: 1.529426097869873
training loss: 1.4722217321395874


training:  52%|█████▏    | 2597/5000 [1:28:34<1:19:14,  1.98s/it]

training loss: 1.4078972339630127
training loss: 1.4160569906234741
training loss: 1.464709997177124
training loss: 1.4488074779510498
training loss: 1.4474294185638428
validation loss: 1.3451194763183594
training loss: 1.476523995399475


training:  52%|█████▏    | 2603/5000 [1:28:46<1:19:22,  1.99s/it]

training loss: 1.4421145915985107
training loss: 1.4714386463165283
training loss: 1.3317002058029175
training loss: 1.4668577909469604
training loss: 1.3183305263519287
training loss: 1.3284685611724854


training:  52%|█████▏    | 2609/5000 [1:28:57<1:19:01,  1.98s/it]

training loss: 1.5868467092514038
training loss: 1.5020699501037598
training loss: 1.4820196628570557
training loss: 1.525510311126709
training loss: 1.4575167894363403
training loss: 1.4665002822875977


training:  52%|█████▏    | 2615/5000 [1:29:09<1:18:42,  1.98s/it]

training loss: 1.4406886100769043
training loss: 1.5231627225875854
training loss: 1.4316298961639404
training loss: 1.4756731986999512
training loss: 1.452451229095459
training loss: 1.4819577932357788


training:  52%|█████▏    | 2621/5000 [1:29:21<1:18:26,  1.98s/it]

training loss: 1.4640288352966309
training loss: 1.4950926303863525
training loss: 1.578385591506958
training loss: 1.2879023551940918
training loss: 1.6484403610229492
training loss: 1.5810848474502563


training:  53%|█████▎    | 2627/5000 [1:29:33<1:18:11,  1.98s/it]

training loss: 1.4277764558792114
training loss: 1.585605263710022
training loss: 1.5923900604248047
training loss: 1.2095086574554443
training loss: 1.5643696784973145
training loss: 1.4782315492630005


training:  53%|█████▎    | 2633/5000 [1:29:45<1:17:57,  1.98s/it]

training loss: 1.471083164215088
training loss: 1.4867162704467773
training loss: 1.3886065483093262
training loss: 1.4520931243896484
training loss: 1.4110791683197021
training loss: 1.6585050821304321


training:  53%|█████▎    | 2639/5000 [1:29:57<1:17:43,  1.98s/it]

training loss: 1.4968129396438599
training loss: 1.4573420286178589
training loss: 1.535170316696167
training loss: 1.4674654006958008
training loss: 1.442504644393921
training loss: 1.4056684970855713


training:  53%|█████▎    | 2645/5000 [1:30:09<1:17:31,  1.98s/it]

training loss: 1.5973424911499023
training loss: 1.6033202409744263
training loss: 1.398059606552124
training loss: 1.536982774734497
training loss: 1.3715267181396484
training loss: 1.3828250169754028


training:  53%|█████▎    | 2651/5000 [1:30:20<1:17:18,  1.97s/it]

training loss: 1.5785471200942993
training loss: 1.4191560745239258
training loss: 1.3994569778442383
training loss: 1.5777851343154907
training loss: 1.537869930267334
training loss: 1.442599892616272


training:  53%|█████▎    | 2657/5000 [1:30:32<1:17:06,  1.97s/it]

training loss: 1.4239836931228638
training loss: 1.5017503499984741
training loss: 1.3802084922790527
training loss: 1.484357476234436
training loss: 1.395378589630127
training loss: 1.5146007537841797


training:  53%|█████▎    | 2663/5000 [1:30:44<1:16:54,  1.97s/it]

training loss: 1.473756194114685
training loss: 1.3476955890655518
training loss: 1.4151272773742676
training loss: 1.4026511907577515
training loss: 1.354620099067688
training loss: 1.4635355472564697


training:  53%|█████▎    | 2669/5000 [1:30:56<1:16:41,  1.97s/it]

training loss: 1.4088468551635742
training loss: 1.3927849531173706
training loss: 1.4386404752731323
training loss: 1.361180067062378
training loss: 1.4144738912582397
training loss: 1.6605652570724487


training:  54%|█████▎    | 2675/5000 [1:31:08<1:16:29,  1.97s/it]

training loss: 1.4612001180648804
training loss: 1.5356841087341309
training loss: 1.5029089450836182
training loss: 1.44279146194458
training loss: 1.5184760093688965
training loss: 1.526172161102295


training:  54%|█████▎    | 2681/5000 [1:31:20<1:16:16,  1.97s/it]

training loss: 1.5176576375961304
training loss: 1.407949686050415
training loss: 1.3533132076263428
training loss: 1.3798655271530151
training loss: 1.4352809190750122
training loss: 1.427959680557251


training:  54%|█████▎    | 2687/5000 [1:31:31<1:16:04,  1.97s/it]

training loss: 1.4403902292251587
training loss: 1.5429234504699707
training loss: 1.5122528076171875
training loss: 1.3696568012237549
training loss: 1.3660476207733154
training loss: 1.4363670349121094


training:  54%|█████▍    | 2693/5000 [1:31:43<1:15:52,  1.97s/it]

training loss: 1.4397025108337402
training loss: 1.4685084819793701
training loss: 1.4396779537200928
training loss: 1.3381837606430054
training loss: 1.5765525102615356
training loss: 1.5476460456848145


training:  54%|█████▍    | 2699/5000 [1:31:55<1:15:40,  1.97s/it]

training loss: 1.4984248876571655
training loss: 1.4231958389282227
training loss: 1.441604495048523
validation loss: 1.3134219646453857
training loss: 1.4916682243347168
training loss: 1.3769539594650269
training loss: 1.3785251379013062


training:  54%|█████▍    | 2705/5000 [1:32:07<1:15:51,  1.98s/it]

training loss: 1.5265289545059204
training loss: 1.3993912935256958
training loss: 1.3133807182312012
training loss: 1.5812947750091553
training loss: 1.3829712867736816
training loss: 1.3824427127838135


training:  54%|█████▍    | 2711/5000 [1:32:19<1:15:32,  1.98s/it]

training loss: 1.4858564138412476
training loss: 1.5186140537261963
training loss: 1.4555188417434692
training loss: 1.5066499710083008
training loss: 1.5329339504241943
training loss: 1.6865586042404175


training:  54%|█████▍    | 2717/5000 [1:32:31<1:15:16,  1.98s/it]

training loss: 1.583770751953125
training loss: 1.4719116687774658
training loss: 1.427375078201294
training loss: 1.579114556312561
training loss: 1.5044878721237183
training loss: 1.4600839614868164


training:  54%|█████▍    | 2723/5000 [1:32:43<1:15:01,  1.98s/it]

training loss: 1.4498181343078613
training loss: 1.5377566814422607
training loss: 1.4796468019485474
training loss: 1.4766584634780884
training loss: 1.4092929363250732
training loss: 1.4126782417297363


training:  55%|█████▍    | 2729/5000 [1:32:54<1:14:47,  1.98s/it]

training loss: 1.4852499961853027
training loss: 1.4097999334335327
training loss: 1.426288366317749
training loss: 1.581048846244812
training loss: 1.3620917797088623
training loss: 1.4875528812408447


training:  55%|█████▍    | 2735/5000 [1:33:06<1:14:33,  1.98s/it]

training loss: 1.4768732786178589
training loss: 1.5081303119659424
training loss: 1.3987367153167725
training loss: 1.4901589155197144
training loss: 1.3866112232208252
training loss: 1.4399137496948242


training:  55%|█████▍    | 2741/5000 [1:33:18<1:14:21,  1.97s/it]

training loss: 1.4545342922210693
training loss: 1.4969947338104248
training loss: 1.48171067237854
training loss: 1.34096360206604
training loss: 1.3673136234283447
training loss: 1.5447744131088257


training:  55%|█████▍    | 2747/5000 [1:33:30<1:14:08,  1.97s/it]

training loss: 1.54075288772583
training loss: 1.5995503664016724
training loss: 1.4741449356079102
training loss: 1.552837610244751
training loss: 1.3874545097351074
training loss: 1.4640312194824219


training:  55%|█████▌    | 2753/5000 [1:33:42<1:13:56,  1.97s/it]

training loss: 1.4700473546981812
training loss: 1.400490641593933
training loss: 1.5270497798919678
training loss: 1.4945685863494873
training loss: 1.5412074327468872
training loss: 1.5279273986816406


training:  55%|█████▌    | 2759/5000 [1:33:54<1:13:43,  1.97s/it]

training loss: 1.4423167705535889
training loss: 1.4960094690322876
training loss: 1.464475154876709
training loss: 1.5480680465698242
training loss: 1.4642256498336792
training loss: 1.4726163148880005


training:  55%|█████▌    | 2765/5000 [1:34:06<1:13:32,  1.97s/it]

training loss: 1.4153450727462769
training loss: 1.4132698774337769
training loss: 1.3878917694091797
training loss: 1.4896657466888428
training loss: 1.4288092851638794
training loss: 1.5074195861816406


training:  55%|█████▌    | 2771/5000 [1:34:17<1:13:19,  1.97s/it]

training loss: 1.5924962759017944
training loss: 1.4807982444763184
training loss: 1.3756998777389526
training loss: 1.3869738578796387
training loss: 1.4227371215820312
training loss: 1.3164100646972656


training:  56%|█████▌    | 2777/5000 [1:34:29<1:13:08,  1.97s/it]

training loss: 1.5212407112121582
training loss: 1.4576257467269897
training loss: 1.4588807821273804
training loss: 1.4357160329818726
training loss: 1.5550485849380493
training loss: 1.4263454675674438


training:  56%|█████▌    | 2783/5000 [1:34:41<1:12:56,  1.97s/it]

training loss: 1.5586835145950317
training loss: 1.5393435955047607
training loss: 1.5235191583633423
training loss: 1.4288015365600586
training loss: 1.315995216369629
training loss: 1.5269519090652466


training:  56%|█████▌    | 2789/5000 [1:34:53<1:12:44,  1.97s/it]

training loss: 1.5283194780349731
training loss: 1.4620195627212524
training loss: 1.457452654838562
training loss: 1.4869314432144165
training loss: 1.6963542699813843
training loss: 1.5275651216506958


training:  56%|█████▌    | 2795/5000 [1:35:05<1:12:32,  1.97s/it]

training loss: 1.6570295095443726
training loss: 1.5858650207519531
training loss: 1.5961546897888184
training loss: 1.3821189403533936
training loss: 1.4539164304733276
training loss: 1.449346899986267
training loss: 1.5171552896499634


training:  56%|█████▌    | 2801/5000 [1:35:17<1:12:42,  1.98s/it]

validation loss: 1.4731645584106445
training loss: 1.385116457939148
training loss: 1.5004619359970093
training loss: 1.4490443468093872
training loss: 1.433279275894165
training loss: 1.3580327033996582


training:  56%|█████▌    | 2807/5000 [1:35:29<1:12:23,  1.98s/it]

training loss: 1.631245732307434
training loss: 1.3887149095535278
training loss: 1.5786807537078857
training loss: 1.4135384559631348
training loss: 1.4136496782302856
training loss: 1.436843991279602


training:  56%|█████▋    | 2813/5000 [1:35:40<1:12:07,  1.98s/it]

training loss: 1.4333455562591553
training loss: 1.456861138343811
training loss: 1.4296809434890747
training loss: 1.457222819328308
training loss: 1.3638582229614258
training loss: 1.4866890907287598


training:  56%|█████▋    | 2819/5000 [1:35:52<1:11:52,  1.98s/it]

training loss: 1.4523338079452515
training loss: 1.4697835445404053
training loss: 1.4315353631973267
training loss: 1.6541484594345093
training loss: 1.4580968618392944
training loss: 1.4644403457641602


training:  56%|█████▋    | 2825/5000 [1:36:04<1:11:38,  1.98s/it]

training loss: 1.469451665878296
training loss: 1.5252958536148071
training loss: 1.564063549041748
training loss: 1.4641348123550415
training loss: 1.442651391029358
training loss: 1.3930909633636475


training:  57%|█████▋    | 2831/5000 [1:36:16<1:11:25,  1.98s/it]

training loss: 1.4481806755065918
training loss: 1.404274344444275
training loss: 1.5070676803588867
training loss: 1.4544322490692139
training loss: 1.301895260810852
training loss: 1.4752798080444336


training:  57%|█████▋    | 2837/5000 [1:36:28<1:11:12,  1.98s/it]

training loss: 1.3278416395187378
training loss: 1.4948146343231201
training loss: 1.5778597593307495
training loss: 1.4349342584609985
training loss: 1.457034707069397
training loss: 1.5963842868804932


training:  57%|█████▋    | 2843/5000 [1:36:40<1:10:59,  1.97s/it]

training loss: 1.6059954166412354
training loss: 1.4579601287841797
training loss: 1.3285589218139648
training loss: 1.4359816312789917
training loss: 1.4435089826583862


training:  57%|█████▋    | 2843/5000 [1:36:50<1:10:59,  1.97s/it]

training loss: 1.3890691995620728


training:  57%|█████▋    | 2849/5000 [1:36:52<1:10:47,  1.97s/it]

training loss: 1.4666332006454468
training loss: 1.392553687095642
training loss: 1.4586142301559448
training loss: 1.6677030324935913
training loss: 1.4184209108352661
training loss: 1.5914909839630127


training:  57%|█████▋    | 2855/5000 [1:37:03<1:10:34,  1.97s/it]

training loss: 1.5213724374771118
training loss: 1.608230710029602
training loss: 1.5451959371566772
training loss: 1.4763429164886475
training loss: 1.5122400522232056
training loss: 1.5015668869018555


training:  57%|█████▋    | 2861/5000 [1:37:15<1:10:22,  1.97s/it]

training loss: 1.4355173110961914
training loss: 1.512451171875
training loss: 1.3517364263534546
training loss: 1.4171044826507568
training loss: 1.5118111371994019
training loss: 1.410333514213562


training:  57%|█████▋    | 2867/5000 [1:37:27<1:10:10,  1.97s/it]

training loss: 1.175642490386963
training loss: 1.5009799003601074
training loss: 1.3568426370620728
training loss: 1.4782699346542358
training loss: 1.3558433055877686
training loss: 1.3949875831604004


training:  57%|█████▋    | 2873/5000 [1:37:39<1:09:59,  1.97s/it]

training loss: 1.4472321271896362
training loss: 1.474300503730774
training loss: 1.501639485359192
training loss: 1.509456753730774
training loss: 1.4855880737304688
training loss: 1.4704235792160034


training:  58%|█████▊    | 2879/5000 [1:37:51<1:09:47,  1.97s/it]

training loss: 1.5716232061386108
training loss: 1.5756702423095703
training loss: 1.4399433135986328
training loss: 1.2848879098892212
training loss: 1.3345056772232056
training loss: 1.476422667503357


training:  58%|█████▊    | 2885/5000 [1:38:03<1:09:35,  1.97s/it]

training loss: 1.3667975664138794
training loss: 1.548261046409607
training loss: 1.3800777196884155
training loss: 1.3674708604812622
training loss: 1.5385791063308716
training loss: 1.4570509195327759


training:  58%|█████▊    | 2891/5000 [1:38:14<1:09:23,  1.97s/it]

training loss: 1.5112348794937134
training loss: 1.4012699127197266
training loss: 1.5159868001937866
training loss: 1.669937252998352
training loss: 1.4890741109848022
training loss: 1.674286127090454


training:  58%|█████▊    | 2897/5000 [1:38:26<1:09:11,  1.97s/it]

training loss: 1.427927017211914
training loss: 1.4309273958206177
training loss: 1.405409336090088
training loss: 1.4704746007919312
training loss: 1.5049419403076172
validation loss: 1.3639919757843018
training loss: 1.420027494430542


training:  58%|█████▊    | 2903/5000 [1:38:38<1:09:19,  1.98s/it]

training loss: 1.4862502813339233
training loss: 1.4959884881973267
training loss: 1.3850780725479126
training loss: 1.3955572843551636
training loss: 1.503602147102356
training loss: 1.4336838722229004


training:  58%|█████▊    | 2909/5000 [1:38:50<1:09:01,  1.98s/it]

training loss: 1.4438456296920776
training loss: 1.5565998554229736
training loss: 1.4277963638305664
training loss: 1.4575669765472412
training loss: 1.5620529651641846
training loss: 1.4849976301193237


training:  58%|█████▊    | 2915/5000 [1:39:02<1:08:45,  1.98s/it]

training loss: 1.491075873374939
training loss: 1.5740902423858643
training loss: 1.5308281183242798
training loss: 1.4787405729293823
training loss: 1.5059254169464111
training loss: 1.5040814876556396


training:  58%|█████▊    | 2921/5000 [1:39:14<1:08:30,  1.98s/it]

training loss: 1.3840575218200684
training loss: 1.4745290279388428
training loss: 1.3862665891647339
training loss: 1.5893477201461792
training loss: 1.4480594396591187
training loss: 1.4502464532852173


training:  59%|█████▊    | 2927/5000 [1:39:26<1:08:16,  1.98s/it]

training loss: 1.43938410282135
training loss: 1.541108250617981
training loss: 1.4889779090881348
training loss: 1.5032204389572144
training loss: 1.424477219581604
training loss: 1.4957324266433716


training:  59%|█████▊    | 2933/5000 [1:39:38<1:08:02,  1.98s/it]

training loss: 1.4056490659713745
training loss: 1.2682926654815674
training loss: 1.4589828252792358
training loss: 1.4156615734100342
training loss: 1.341193437576294
training loss: 1.5087621212005615


training:  59%|█████▉    | 2939/5000 [1:39:49<1:07:50,  1.97s/it]

training loss: 1.57941734790802
training loss: 1.4984787702560425
training loss: 1.4963663816452026
training loss: 1.3828012943267822
training loss: 1.4555853605270386
training loss: 1.4528247117996216


training:  59%|█████▉    | 2945/5000 [1:40:01<1:07:37,  1.97s/it]

training loss: 1.6083637475967407
training loss: 1.4086939096450806
training loss: 1.4930235147476196
training loss: 1.4180852174758911
training loss: 1.5311815738677979
training loss: 1.3404183387756348


training:  59%|█████▉    | 2951/5000 [1:40:13<1:07:25,  1.97s/it]

training loss: 1.3843551874160767
training loss: 1.3931299448013306
training loss: 1.4177132844924927
training loss: 1.5021916627883911
training loss: 1.3863238096237183
training loss: 1.4756840467453003


training:  59%|█████▉    | 2957/5000 [1:40:25<1:07:12,  1.97s/it]

training loss: 1.6519771814346313
training loss: 1.482383131980896
training loss: 1.4800859689712524
training loss: 1.4543441534042358
training loss: 1.5108879804611206
training loss: 1.5649877786636353


training:  59%|█████▉    | 2963/5000 [1:40:37<1:07:01,  1.97s/it]

training loss: 1.7112003564834595
training loss: 1.3689148426055908
training loss: 1.537587285041809
training loss: 1.3503485918045044
training loss: 1.5686815977096558
training loss: 1.4577337503433228


training:  59%|█████▉    | 2969/5000 [1:40:49<1:06:49,  1.97s/it]

training loss: 1.6260734796524048
training loss: 1.411831259727478
training loss: 1.5447056293487549
training loss: 1.4033186435699463
training loss: 1.5284441709518433
training loss: 1.3098169565200806


training:  60%|█████▉    | 2975/5000 [1:41:00<1:06:37,  1.97s/it]

training loss: 1.5923817157745361
training loss: 1.3918637037277222
training loss: 1.5430413484573364
training loss: 1.4666093587875366
training loss: 1.5161938667297363
training loss: 1.4167850017547607


training:  60%|█████▉    | 2981/5000 [1:41:12<1:06:26,  1.97s/it]

training loss: 1.4727613925933838
training loss: 1.3446760177612305
training loss: 1.4902898073196411
training loss: 1.2798291444778442
training loss: 1.477243423461914
training loss: 1.4747387170791626


training:  60%|█████▉    | 2987/5000 [1:41:24<1:06:13,  1.97s/it]

training loss: 1.447940707206726
training loss: 1.5725866556167603
training loss: 1.3687268495559692
training loss: 1.4468331336975098
training loss: 1.5411673784255981
training loss: 1.377694010734558


training:  60%|█████▉    | 2993/5000 [1:41:36<1:06:02,  1.97s/it]

training loss: 1.5220065116882324
training loss: 1.4990171194076538
training loss: 1.5333060026168823
training loss: 1.5090521574020386
training loss: 1.4457423686981201
training loss: 1.4213112592697144


training:  60%|█████▉    | 2999/5000 [1:41:48<1:05:50,  1.97s/it]

training loss: 1.5162752866744995
training loss: 1.4034279584884644
training loss: 1.4202806949615479
validation loss: 1.3294206857681274
%s 

 %s ("d archaeological evidence are scarce, it appears that by the seventh century, Srivijaya established suzerainty over large areas of [[Sumatra]], western [[Java (island)|Java]], and much of the [[Malay Peninsula]]. Dominating the [[Strait of Malacca|Malacca]] and [[Sunda Strait|Sunda]] [[straits]], Srivijaya controlled both the [[Spice Route]] traffic and local trade, charging a toll on passing ships, and remained a formidable sea power until the thirteenth century. This spread the [[Malay people|Malay]] culture throughout Sumatra, the Malay Peninsula, and western [[Borneo]].   A stronghold of [[Vajrayana]] [[Buddhism]], Srivijaya attracted pilgrims and scholars from other parts of Asia. These included the Chinese monk [[Yijing]], who made several lengthy visits to Sumatra on his way to study at Nalanda in India in 671 and 695, and the eleve

training:  60%|██████    | 3001/5000 [1:42:22<2:09:06,  3.88s/it]

ied here.  Honglish music, and can and very dare ful, he legian offers today in the [[Dectansualiss Dosore Day]] and [[Dwney]], [[Daming|Ch Daningdoch]] tokespable sing shinks of the rerunning of thars pontwated throbsonal [[Pulcoara&qudent]]s.  ===Londling tealdisties== The Pitch Shoptericing the immedite our stoms alsoluin as any in acting othing and sowe, stufferionshir finited throse the weeks, or tharoger. Basing. It remerith the [[aux]] abaly is thoristic winned outher dobstratublishirts and th on the
training loss: 1.4182134866714478
training loss: 1.4067423343658447
training loss: 1.3496004343032837
training loss: 1.5030766725540161
training loss: 1.5386643409729004


training:  60%|██████    | 3007/5000 [1:42:34<1:46:41,  3.21s/it]

training loss: 1.388730525970459
training loss: 1.4119927883148193
training loss: 1.3275803327560425
training loss: 1.4316655397415161
training loss: 1.4994441270828247
training loss: 1.436060905456543


training:  60%|██████    | 3013/5000 [1:42:46<1:32:44,  2.80s/it]

training loss: 1.7198028564453125
training loss: 1.3681682348251343
training loss: 1.2055634260177612
training loss: 1.5631499290466309
training loss: 1.4440754652023315
training loss: 1.543764352798462


training:  60%|██████    | 3019/5000 [1:42:58<1:23:40,  2.53s/it]

training loss: 1.459538221359253
training loss: 1.450385570526123
training loss: 1.4921752214431763
training loss: 1.4772814512252808
training loss: 1.4514471292495728
training loss: 1.4959036111831665


training:  60%|██████    | 3025/5000 [1:43:10<1:17:36,  2.36s/it]

training loss: 1.4349397420883179
training loss: 1.3885914087295532
training loss: 1.436683177947998
training loss: 1.4335830211639404
training loss: 1.494545817375183
training loss: 1.4181658029556274


training:  61%|██████    | 3031/5000 [1:43:21<1:13:27,  2.24s/it]

training loss: 1.4767146110534668
training loss: 1.3130358457565308
training loss: 1.5028595924377441
training loss: 1.3852139711380005
training loss: 1.4371931552886963
training loss: 1.4297548532485962


training:  61%|██████    | 3037/5000 [1:43:33<1:10:34,  2.16s/it]

training loss: 1.363045334815979
training loss: 1.5418506860733032
training loss: 1.358047604560852
training loss: 1.3636561632156372
training loss: 1.4526762962341309
training loss: 1.526328444480896


training:  61%|██████    | 3043/5000 [1:43:45<1:08:31,  2.10s/it]

training loss: 1.4928869009017944
training loss: 1.3977681398391724
training loss: 1.4709137678146362
training loss: 1.5774897336959839
training loss: 1.3311190605163574
training loss: 1.4123109579086304


training:  61%|██████    | 3049/5000 [1:43:57<1:07:03,  2.06s/it]

training loss: 1.5358468294143677
training loss: 1.4299184083938599
training loss: 1.4043543338775635
training loss: 1.4399305582046509
training loss: 1.4415267705917358
training loss: 1.4316812753677368


training:  61%|██████    | 3055/5000 [1:44:09<1:05:59,  2.04s/it]

training loss: 1.4319535493850708
training loss: 1.6633332967758179
training loss: 1.3689576387405396
training loss: 1.419723391532898
training loss: 1.5082944631576538
training loss: 1.3787914514541626


training:  61%|██████    | 3061/5000 [1:44:21<1:05:10,  2.02s/it]

training loss: 1.4887988567352295
training loss: 1.3704420328140259
training loss: 1.4335911273956299
training loss: 1.5799201726913452
training loss: 1.4545551538467407
training loss: 1.3873456716537476


training:  61%|██████▏   | 3067/5000 [1:44:32<1:04:33,  2.00s/it]

training loss: 1.4103320837020874
training loss: 1.424691915512085
training loss: 1.5526326894760132
training loss: 1.3903729915618896
training loss: 1.4052239656448364
training loss: 1.5519553422927856


training:  61%|██████▏   | 3073/5000 [1:44:44<1:04:04,  1.99s/it]

training loss: 1.4392675161361694
training loss: 1.367491364479065
training loss: 1.5567784309387207
training loss: 1.5083346366882324
training loss: 1.4967197179794312
training loss: 1.4881664514541626


training:  62%|██████▏   | 3079/5000 [1:44:56<1:03:39,  1.99s/it]

training loss: 1.579522967338562
training loss: 1.3680208921432495
training loss: 1.2913768291473389
training loss: 1.3846083879470825
training loss: 1.3336864709854126
training loss: 1.4077552556991577


training:  62%|██████▏   | 3085/5000 [1:45:08<1:03:19,  1.98s/it]

training loss: 1.4663186073303223
training loss: 1.548700213432312
training loss: 1.4603908061981201
training loss: 1.4323490858078003
training loss: 1.4706302881240845
training loss: 1.4589451551437378


training:  62%|██████▏   | 3091/5000 [1:45:20<1:03:01,  1.98s/it]

training loss: 1.400952696800232
training loss: 1.6734849214553833
training loss: 1.4350814819335938
training loss: 1.3984874486923218
training loss: 1.3708717823028564
training loss: 1.45729398727417


training:  62%|██████▏   | 3097/5000 [1:45:32<1:02:45,  1.98s/it]

training loss: 1.5063281059265137
training loss: 1.3729640245437622
training loss: 1.463085412979126
training loss: 1.4796741008758545
training loss: 1.4011176824569702
validation loss: 1.1121435165405273
training loss: 1.6429890394210815


training:  62%|██████▏   | 3103/5000 [1:45:44<1:02:49,  1.99s/it]

training loss: 1.4157911539077759
training loss: 1.4829083681106567
training loss: 1.4303874969482422
training loss: 1.400750756263733
training loss: 1.4903461933135986
training loss: 1.4543030261993408


training:  62%|██████▏   | 3109/5000 [1:45:56<1:02:29,  1.98s/it]

training loss: 1.3773136138916016
training loss: 1.4693177938461304
training loss: 1.3004261255264282
training loss: 1.486796498298645
training loss: 1.5231174230575562
training loss: 1.24250328540802


training:  62%|██████▏   | 3115/5000 [1:46:07<1:02:12,  1.98s/it]

training loss: 1.5464885234832764
training loss: 1.47685706615448
training loss: 1.3868907690048218
training loss: 1.4306092262268066
training loss: 1.471664547920227
training loss: 1.6799900531768799


training:  62%|██████▏   | 3121/5000 [1:46:19<1:01:56,  1.98s/it]

training loss: 1.4588215351104736
training loss: 1.3584954738616943
training loss: 1.502299427986145
training loss: 1.4688009023666382
training loss: 1.4311002492904663
training loss: 1.3778786659240723


training:  63%|██████▎   | 3127/5000 [1:46:31<1:01:41,  1.98s/it]

training loss: 1.4957330226898193
training loss: 1.489763855934143
training loss: 1.4153180122375488
training loss: 1.3494998216629028
training loss: 1.4261640310287476
training loss: 1.531239628791809


training:  63%|██████▎   | 3133/5000 [1:46:43<1:01:28,  1.98s/it]

training loss: 1.5604995489120483
training loss: 1.2397911548614502
training loss: 1.476839542388916
training loss: 1.4076553583145142
training loss: 1.5760703086853027
training loss: 1.5329740047454834


training:  63%|██████▎   | 3139/5000 [1:46:55<1:01:15,  1.97s/it]

training loss: 1.4828578233718872
training loss: 1.431612491607666
training loss: 1.645950198173523
training loss: 1.3820711374282837
training loss: 1.4231184720993042
training loss: 1.5013563632965088


training:  63%|██████▎   | 3145/5000 [1:47:07<1:01:02,  1.97s/it]

training loss: 1.4082036018371582
training loss: 1.3686332702636719
training loss: 1.4395939111709595
training loss: 1.5068751573562622
training loss: 1.4015403985977173
training loss: 1.4952455759048462


training:  63%|██████▎   | 3151/5000 [1:47:18<1:00:50,  1.97s/it]

training loss: 1.1873879432678223
training loss: 1.5108911991119385
training loss: 1.5023096799850464
training loss: 1.4885700941085815
training loss: 1.4824358224868774
training loss: 1.4244704246520996


training:  63%|██████▎   | 3157/5000 [1:47:30<1:00:38,  1.97s/it]

training loss: 1.5621219873428345
training loss: 1.3915555477142334
training loss: 1.3176918029785156
training loss: 1.546414852142334
training loss: 1.4435186386108398
training loss: 1.5576056241989136


training:  63%|██████▎   | 3163/5000 [1:47:42<1:00:25,  1.97s/it]

training loss: 1.516011357307434
training loss: 1.4269051551818848
training loss: 1.3312181234359741
training loss: 1.4264522790908813
training loss: 1.5115066766738892
training loss: 1.5528229475021362


training:  63%|██████▎   | 3169/5000 [1:47:54<1:00:13,  1.97s/it]

training loss: 1.4111382961273193
training loss: 1.503526210784912
training loss: 1.5074005126953125
training loss: 1.4839078187942505
training loss: 1.3752244710922241
training loss: 1.441041111946106


training:  64%|██████▎   | 3175/5000 [1:48:06<1:00:01,  1.97s/it]

training loss: 1.6716604232788086
training loss: 1.3645734786987305
training loss: 1.4733619689941406
training loss: 1.5206412076950073
training loss: 1.3497964143753052
training loss: 1.4246811866760254


training:  64%|██████▎   | 3181/5000 [1:48:18<59:49,  1.97s/it]  

training loss: 1.5115904808044434
training loss: 1.3866368532180786
training loss: 1.5058475732803345
training loss: 1.3673268556594849
training loss: 1.4052461385726929
training loss: 1.395093321800232


training:  64%|██████▎   | 3187/5000 [1:48:29<59:37,  1.97s/it]

training loss: 1.5400280952453613
training loss: 1.490068793296814
training loss: 1.3408176898956299
training loss: 1.4724124670028687
training loss: 1.4069124460220337
training loss: 1.4795653820037842


training:  64%|██████▍   | 3193/5000 [1:48:41<59:25,  1.97s/it]

training loss: 1.468703031539917
training loss: 1.5318800210952759
training loss: 1.4675849676132202
training loss: 1.3486642837524414
training loss: 1.3712033033370972
training loss: 1.483094573020935


training:  64%|██████▍   | 3199/5000 [1:48:53<59:14,  1.97s/it]

training loss: 1.3453545570373535
training loss: 1.4563850164413452
training loss: 1.3673598766326904
validation loss: 1.4090614318847656
training loss: 1.383749008178711
training loss: 1.522695779800415
training loss: 1.3807384967803955


training:  64%|██████▍   | 3205/5000 [1:49:05<59:20,  1.98s/it]

training loss: 1.3827180862426758
training loss: 1.3723058700561523
training loss: 1.4325751066207886
training loss: 1.600688099861145
training loss: 1.3888880014419556
training loss: 1.5670775175094604


training:  64%|██████▍   | 3211/5000 [1:49:17<59:02,  1.98s/it]

training loss: 1.5149630308151245
training loss: 1.450976014137268
training loss: 1.5019397735595703
training loss: 1.5496693849563599
training loss: 1.439286708831787
training loss: 1.4339122772216797


training:  64%|██████▍   | 3217/5000 [1:49:29<58:47,  1.98s/it]

training loss: 1.5066622495651245
training loss: 1.5159474611282349
training loss: 1.3479570150375366
training loss: 1.402173638343811
training loss: 1.5056020021438599
training loss: 1.4791202545166016


training:  64%|██████▍   | 3223/5000 [1:49:41<58:32,  1.98s/it]

training loss: 1.5785448551177979
training loss: 1.4019675254821777
training loss: 1.427959680557251
training loss: 1.3232234716415405
training loss: 1.4447379112243652
training loss: 1.5035219192504883


training:  65%|██████▍   | 3229/5000 [1:49:53<58:19,  1.98s/it]

training loss: 1.4047904014587402
training loss: 1.4600847959518433
training loss: 1.496148943901062
training loss: 1.421218991279602
training loss: 1.4366506338119507
training loss: 1.496362328529358


training:  65%|██████▍   | 3235/5000 [1:50:04<58:06,  1.98s/it]

training loss: 1.4083293676376343
training loss: 1.3758862018585205
training loss: 1.4556657075881958
training loss: 1.476668357849121
training loss: 1.4232232570648193
training loss: 1.5254294872283936


training:  65%|██████▍   | 3241/5000 [1:50:16<57:53,  1.97s/it]

training loss: 1.4205021858215332
training loss: 1.3825123310089111
training loss: 1.4324628114700317
training loss: 1.4821224212646484
training loss: 1.4817920923233032
training loss: 1.3445618152618408


training:  65%|██████▍   | 3247/5000 [1:50:28<57:41,  1.97s/it]

training loss: 1.5083078145980835
training loss: 1.4820443391799927
training loss: 1.384941816329956
training loss: 1.436020016670227
training loss: 1.4558453559875488
training loss: 1.4575953483581543


training:  65%|██████▌   | 3253/5000 [1:50:40<57:29,  1.97s/it]

training loss: 1.6159056425094604
training loss: 1.412423849105835
training loss: 1.4650187492370605
training loss: 1.7765674591064453
training loss: 1.5229032039642334
training loss: 1.400051474571228


training:  65%|██████▌   | 3259/5000 [1:50:52<57:17,  1.97s/it]

training loss: 1.4418803453445435
training loss: 1.4085396528244019
training loss: 1.5037615299224854
training loss: 1.505362629890442
training loss: 1.513480544090271
training loss: 1.4464997053146362


training:  65%|██████▌   | 3265/5000 [1:51:04<57:04,  1.97s/it]

training loss: 1.519557237625122
training loss: 1.4244093894958496
training loss: 1.5073164701461792
training loss: 1.26905357837677
training loss: 1.5151084661483765
training loss: 1.4398796558380127


training:  65%|██████▌   | 3271/5000 [1:51:15<56:53,  1.97s/it]

training loss: 1.3715373277664185
training loss: 1.5998470783233643
training loss: 1.5232118368148804
training loss: 1.6713051795959473
training loss: 1.420293927192688
training loss: 1.4594358205795288


training:  66%|██████▌   | 3277/5000 [1:51:27<56:41,  1.97s/it]

training loss: 1.4138810634613037
training loss: 1.4008487462997437
training loss: 1.5122870206832886
training loss: 1.5007187128067017
training loss: 1.5542494058609009
training loss: 1.2106188535690308


training:  66%|██████▌   | 3283/5000 [1:51:39<56:29,  1.97s/it]

training loss: 1.4879499673843384
training loss: 1.4759612083435059
training loss: 1.5325173139572144
training loss: 1.4591773748397827
training loss: 1.4761558771133423
training loss: 1.3394215106964111


training:  66%|██████▌   | 3289/5000 [1:51:51<56:17,  1.97s/it]

training loss: 1.4335205554962158
training loss: 1.5412557125091553
training loss: 1.588295578956604
training loss: 1.3539047241210938
training loss: 1.428283452987671
training loss: 1.4801139831542969


training:  66%|██████▌   | 3295/5000 [1:52:03<56:05,  1.97s/it]

training loss: 1.4443163871765137
training loss: 1.6269655227661133
training loss: 1.486199140548706
training loss: 1.4656264781951904
training loss: 1.413139820098877
training loss: 1.4924097061157227
training loss: 1.528176188468933


training:  66%|██████▌   | 3301/5000 [1:52:15<56:09,  1.98s/it]

validation loss: 1.2171939611434937
training loss: 1.5586668252944946
training loss: 1.4972401857376099
training loss: 1.5630933046340942
training loss: 1.474760890007019
training loss: 1.2981330156326294


training:  66%|██████▌   | 3307/5000 [1:52:27<55:53,  1.98s/it]

training loss: 1.465894103050232
training loss: 1.4725420475006104
training loss: 1.4684048891067505
training loss: 1.5032480955123901
training loss: 1.4848690032958984
training loss: 1.447082281112671


training:  66%|██████▋   | 3313/5000 [1:52:39<55:37,  1.98s/it]

training loss: 1.50575852394104
training loss: 1.371765375137329
training loss: 1.3436044454574585
training loss: 1.3885151147842407
training loss: 1.4681376218795776
training loss: 1.4016538858413696


training:  66%|██████▋   | 3319/5000 [1:52:50<55:23,  1.98s/it]

training loss: 1.3988425731658936
training loss: 1.284074306488037
training loss: 1.477352261543274
training loss: 1.5395848751068115
training loss: 1.4630557298660278
training loss: 1.430497646331787


training:  66%|██████▋   | 3325/5000 [1:53:02<55:09,  1.98s/it]

training loss: 1.5651310682296753
training loss: 1.424891471862793
training loss: 1.3562897443771362
training loss: 1.4390581846237183
training loss: 1.4370231628417969
training loss: 1.543806791305542


training:  67%|██████▋   | 3331/5000 [1:53:14<54:56,  1.98s/it]

training loss: 1.5579164028167725
training loss: 1.5605442523956299
training loss: 1.3768998384475708
training loss: 1.4313338994979858
training loss: 1.5317898988723755
training loss: 1.199959397315979


training:  67%|██████▋   | 3337/5000 [1:53:26<54:44,  1.98s/it]

training loss: 1.4578354358673096
training loss: 1.5752458572387695
training loss: 1.1717443466186523
training loss: 1.5335900783538818
training loss: 1.4780635833740234
training loss: 1.4076507091522217


training:  67%|██████▋   | 3343/5000 [1:53:38<54:32,  1.97s/it]

training loss: 1.557395100593567
training loss: 1.3838958740234375
training loss: 1.5349807739257812
training loss: 1.5278394222259521
training loss: 1.6718754768371582
training loss: 1.4494075775146484


training:  67%|██████▋   | 3349/5000 [1:53:50<54:19,  1.97s/it]

training loss: 1.52414870262146
training loss: 1.4426015615463257
training loss: 1.517683506011963
training loss: 1.388252854347229
training loss: 1.4301701784133911
training loss: 1.494008183479309


training:  67%|██████▋   | 3355/5000 [1:54:01<54:07,  1.97s/it]

training loss: 1.5360232591629028
training loss: 1.452953815460205
training loss: 1.5229359865188599
training loss: 1.4377752542495728
training loss: 1.5086112022399902
training loss: 1.4903303384780884


training:  67%|██████▋   | 3361/5000 [1:54:13<53:55,  1.97s/it]

training loss: 1.435091257095337
training loss: 1.3615875244140625
training loss: 1.4844132661819458
training loss: 1.4357515573501587
training loss: 1.4521046876907349
training loss: 1.4206268787384033


training:  67%|██████▋   | 3367/5000 [1:54:25<53:43,  1.97s/it]

training loss: 1.388379454612732
training loss: 1.4639334678649902
training loss: 1.3977222442626953
training loss: 1.3420689105987549
training loss: 1.4632397890090942
training loss: 1.4603426456451416


training:  67%|██████▋   | 3373/5000 [1:54:37<53:31,  1.97s/it]

training loss: 1.567983865737915
training loss: 1.476110816001892
training loss: 1.3675389289855957
training loss: 1.45047128200531
training loss: 1.3725311756134033
training loss: 1.3214328289031982


training:  68%|██████▊   | 3379/5000 [1:54:49<53:19,  1.97s/it]

training loss: 1.5104347467422485
training loss: 1.3417563438415527
training loss: 1.577048420906067
training loss: 1.4408162832260132
training loss: 1.4682133197784424
training loss: 1.498718023300171


training:  68%|██████▊   | 3385/5000 [1:55:01<53:07,  1.97s/it]

training loss: 1.5351884365081787
training loss: 1.5402575731277466
training loss: 1.40956711769104
training loss: 1.363925814628601
training loss: 1.4878718852996826
training loss: 1.5235081911087036


training:  68%|██████▊   | 3391/5000 [1:55:13<52:55,  1.97s/it]

training loss: 1.2651432752609253
training loss: 1.3871674537658691
training loss: 1.4751989841461182
training loss: 1.5794475078582764
training loss: 1.5192791223526
training loss: 1.4778562784194946


training:  68%|██████▊   | 3397/5000 [1:55:24<52:43,  1.97s/it]

training loss: 1.5222615003585815
training loss: 1.3846136331558228
training loss: 1.4583756923675537
training loss: 1.48560631275177
training loss: 1.418968915939331
validation loss: 1.2839466333389282
training loss: 1.5499629974365234


training:  68%|██████▊   | 3403/5000 [1:55:36<52:47,  1.98s/it]

training loss: 1.500439167022705
training loss: 1.4786239862442017
training loss: 1.7223048210144043
training loss: 1.5312222242355347
training loss: 1.51788330078125
training loss: 1.3884782791137695


training:  68%|██████▊   | 3409/5000 [1:55:48<52:30,  1.98s/it]

training loss: 1.562686800956726
training loss: 1.4651367664337158
training loss: 1.4846221208572388
training loss: 1.4936864376068115
training loss: 1.4451313018798828
training loss: 1.4675427675247192


training:  68%|██████▊   | 3415/5000 [1:56:00<52:15,  1.98s/it]

training loss: 1.4968372583389282
training loss: 1.5084015130996704
training loss: 1.5101414918899536
training loss: 1.4745252132415771
training loss: 1.5048561096191406
training loss: 1.4934043884277344


training:  68%|██████▊   | 3421/5000 [1:56:12<52:01,  1.98s/it]

training loss: 1.4170242547988892
training loss: 1.519202709197998
training loss: 1.5714260339736938
training loss: 1.438730239868164
training loss: 1.3853410482406616
training loss: 1.3617991209030151


training:  69%|██████▊   | 3427/5000 [1:56:24<51:48,  1.98s/it]

training loss: 1.4980300664901733
training loss: 1.5008872747421265
training loss: 1.41145658493042
training loss: 1.498640775680542
training loss: 1.4834471940994263
training loss: 1.3592396974563599


training:  69%|██████▊   | 3433/5000 [1:56:36<51:35,  1.98s/it]

training loss: 1.5587490797042847
training loss: 1.475968360900879
training loss: 1.5061557292938232
training loss: 1.7432093620300293
training loss: 1.5327491760253906
training loss: 1.3962754011154175


training:  69%|██████▉   | 3439/5000 [1:56:47<51:23,  1.98s/it]

training loss: 1.481355905532837
training loss: 1.315584421157837
training loss: 1.593019723892212
training loss: 1.4740179777145386
training loss: 1.5054658651351929
training loss: 1.4842076301574707


training:  69%|██████▉   | 3445/5000 [1:56:59<51:10,  1.97s/it]

training loss: 1.5643466711044312
training loss: 1.3860812187194824
training loss: 1.4597617387771606
training loss: 1.387113332748413
training loss: 1.4512460231781006
training loss: 1.2728886604309082


training:  69%|██████▉   | 3451/5000 [1:57:11<50:58,  1.97s/it]

training loss: 1.593747854232788
training loss: 1.7159026861190796
training loss: 1.3610233068466187
training loss: 1.4465482234954834
training loss: 1.4048612117767334
training loss: 1.5277099609375


training:  69%|██████▉   | 3457/5000 [1:57:23<50:46,  1.97s/it]

training loss: 1.4329802989959717
training loss: 1.3489822149276733
training loss: 1.3824262619018555
training loss: 1.3875843286514282
training loss: 1.5288851261138916
training loss: 1.5551514625549316


training:  69%|██████▉   | 3463/5000 [1:57:35<50:34,  1.97s/it]

training loss: 1.447540044784546
training loss: 1.4115004539489746
training loss: 1.4991838932037354
training loss: 1.4980812072753906
training loss: 1.3598016500473022
training loss: 1.4983240365982056


training:  69%|██████▉   | 3469/5000 [1:57:47<50:22,  1.97s/it]

training loss: 1.4567861557006836
training loss: 1.3362455368041992
training loss: 1.490679383277893
training loss: 1.5345187187194824
training loss: 1.3782620429992676
training loss: 1.4029067754745483


training:  70%|██████▉   | 3475/5000 [1:57:59<50:10,  1.97s/it]

training loss: 1.3880200386047363
training loss: 1.4481165409088135
training loss: 1.3825289011001587
training loss: 1.4553557634353638
training loss: 1.4832557439804077
training loss: 1.4560831785202026


training:  70%|██████▉   | 3481/5000 [1:58:10<49:58,  1.97s/it]

training loss: 1.6802163124084473
training loss: 1.589648723602295
training loss: 1.4366443157196045
training loss: 1.6401405334472656
training loss: 1.4652483463287354
training loss: 1.4620206356048584


training:  70%|██████▉   | 3487/5000 [1:58:22<49:46,  1.97s/it]

training loss: 1.3134734630584717
training loss: 1.4861332178115845
training loss: 1.4589552879333496
training loss: 1.4743072986602783
training loss: 1.4419972896575928
training loss: 1.4970828294754028


training:  70%|██████▉   | 3493/5000 [1:58:34<49:34,  1.97s/it]

training loss: 1.4906091690063477
training loss: 1.3451578617095947
training loss: 1.5732370615005493
training loss: 1.5153353214263916
training loss: 1.4977918863296509
training loss: 1.5199576616287231


training:  70%|██████▉   | 3499/5000 [1:58:46<49:22,  1.97s/it]

training loss: 1.4795736074447632
training loss: 1.439218521118164
training loss: 1.490630030632019
validation loss: 1.3336083889007568
%s 

 %s (" the ground and then founded the city of Batavia (present-day [[Jakarta]]), modelling it on Amsterdam.  A primary aim of the VOC was the maintenance of its [[monopoly]] of the [[spice trade]] in the archipelago. It did this through the use and threatened use of violence against the peoples of the spice-producing islands, and against non-Dutch outsiders who attempted to trade with them. For example, when the people of the [[Banda Islands]] continued to sell [[nutmeg]] to English merchants, the Dutch killed or deported virtually the entire population and repopulated the islands with VOC indentured servants and slaves who worked in the nutmeg groves.  The VOC became deeply involved in the internal politics of [[Java (island)|Java]] in this period, and fought in a number of wars involving the leaders of [[Mataram]] and [[Banten]] (Bantam).  ===D

training:  70%|███████   | 3501/5000 [1:59:20<1:36:47,  3.87s/it]

t so kitcted the Amentified the USUS$ among of Sites some is nalso eleveled by Proestail fuot;Forty flushical increase &quot;dagged&qust; in when, &qunit actions off an air, actor the Chemic where Henry IV as pposed-on of mission object.  Beang able the [[Pa Coples|Estonivelle|Familyglastician Chemistry]] becof wiong only even this rollance in Benry abortise, uathoof third to.  It han allowed was get f.  Panter [[Extende]], modelist cro] aperity, at the series hand &qumplicant f a Generative of the relited 
training loss: 1.6773545742034912
training loss: 1.378957986831665
training loss: 1.5652720928192139
training loss: 1.4565088748931885
training loss: 1.5182914733886719


training:  70%|███████   | 3507/5000 [1:59:32<1:19:54,  3.21s/it]

training loss: 1.2418614625930786
training loss: 1.5093761682510376
training loss: 1.3642476797103882
training loss: 1.3930915594100952
training loss: 1.6978998184204102
training loss: 1.41648530960083


training:  70%|███████   | 3513/5000 [1:59:44<1:09:22,  2.80s/it]

training loss: 1.401551604270935
training loss: 1.38430917263031
training loss: 1.538649559020996
training loss: 1.4445124864578247
training loss: 1.4145092964172363
training loss: 1.4310948848724365


training:  70%|███████   | 3519/5000 [1:59:56<1:02:31,  2.53s/it]

training loss: 1.4715981483459473
training loss: 1.4299776554107666
training loss: 1.3686221837997437
training loss: 1.4969756603240967
training loss: 1.4431309700012207
training loss: 1.536552906036377


training:  70%|███████   | 3525/5000 [2:00:08<57:56,  2.36s/it]  

training loss: 1.411721110343933
training loss: 1.548973560333252
training loss: 1.522174596786499
training loss: 1.5174751281738281
training loss: 1.453078269958496
training loss: 1.3736274242401123


training:  71%|███████   | 3531/5000 [2:00:19<54:47,  2.24s/it]

training loss: 1.4943695068359375
training loss: 1.499180793762207
training loss: 1.736480951309204
training loss: 1.4381709098815918
training loss: 1.5591329336166382
training loss: 1.3330278396606445


training:  71%|███████   | 3537/5000 [2:00:31<52:35,  2.16s/it]

training loss: 1.55301833152771
training loss: 1.5637316703796387
training loss: 1.401252269744873
training loss: 1.5820668935775757
training loss: 1.442805290222168
training loss: 1.4115946292877197


training:  71%|███████   | 3543/5000 [2:00:43<51:00,  2.10s/it]

training loss: 1.4441683292388916
training loss: 1.3821485042572021
training loss: 1.4483859539031982
training loss: 1.4694273471832275
training loss: 1.5655851364135742
training loss: 1.5228370428085327


training:  71%|███████   | 3549/5000 [2:00:55<49:52,  2.06s/it]

training loss: 1.503321886062622
training loss: 1.4161477088928223
training loss: 1.510331630706787
training loss: 1.3756637573242188
training loss: 1.5083190202713013
training loss: 1.4696099758148193


training:  71%|███████   | 3555/5000 [2:01:07<49:01,  2.04s/it]

training loss: 1.464962124824524
training loss: 1.4729509353637695
training loss: 1.2105133533477783
training loss: 1.4409009218215942
training loss: 1.3612613677978516
training loss: 1.4350899457931519


training:  71%|███████   | 3561/5000 [2:01:19<48:22,  2.02s/it]

training loss: 1.4649322032928467
training loss: 1.4673289060592651
training loss: 1.4088517427444458
training loss: 1.46036696434021
training loss: 1.4848175048828125
training loss: 1.4087131023406982


training:  71%|███████▏  | 3567/5000 [2:01:30<47:51,  2.00s/it]

training loss: 1.3824052810668945
training loss: 1.557026982307434
training loss: 1.6080821752548218
training loss: 1.4649925231933594
training loss: 1.3800928592681885
training loss: 1.4515893459320068


training:  71%|███████▏  | 3573/5000 [2:01:42<47:26,  1.99s/it]

training loss: 1.4430031776428223
training loss: 1.5598986148834229
training loss: 1.5449841022491455
training loss: 1.4351366758346558
training loss: 1.3423314094543457
training loss: 1.5157910585403442


training:  72%|███████▏  | 3579/5000 [2:01:54<47:05,  1.99s/it]

training loss: 1.4739540815353394
training loss: 1.4237397909164429
training loss: 1.4748964309692383
training loss: 1.376524806022644
training loss: 1.4543232917785645
training loss: 1.5315293073654175


training:  72%|███████▏  | 3585/5000 [2:02:06<46:47,  1.98s/it]

training loss: 1.5419504642486572
training loss: 1.4428598880767822
training loss: 1.4375009536743164
training loss: 1.4049922227859497
training loss: 1.4621015787124634
training loss: 1.363189458847046


training:  72%|███████▏  | 3591/5000 [2:02:18<46:31,  1.98s/it]

training loss: 1.4504332542419434
training loss: 1.5632792711257935
training loss: 1.5147451162338257
training loss: 1.446725845336914
training loss: 1.6346044540405273
training loss: 1.5493500232696533


training:  72%|███████▏  | 3597/5000 [2:02:30<46:16,  1.98s/it]

training loss: 1.4404898881912231
training loss: 1.4027471542358398
training loss: 1.3817248344421387
training loss: 1.1866942644119263
training loss: 1.4837195873260498
validation loss: 1.3244856595993042


training:  72%|███████▏  | 3597/5000 [2:02:40<46:16,  1.98s/it]

training loss: 1.4057180881500244


training:  72%|███████▏  | 3603/5000 [2:02:42<46:15,  1.99s/it]

training loss: 1.4793736934661865
training loss: 1.424858570098877
training loss: 1.5259122848510742
training loss: 1.5524165630340576
training loss: 1.5528883934020996
training loss: 1.565479040145874


training:  72%|███████▏  | 3609/5000 [2:02:54<45:58,  1.98s/it]

training loss: 1.3567817211151123
training loss: 1.4387733936309814
training loss: 1.4018478393554688
training loss: 1.5123273134231567
training loss: 1.454639196395874
training loss: 1.3767023086547852


training:  72%|███████▏  | 3615/5000 [2:03:05<45:42,  1.98s/it]

training loss: 1.5254921913146973
training loss: 1.5308510065078735
training loss: 1.4572311639785767
training loss: 1.422186255455017
training loss: 1.3646559715270996
training loss: 1.5479397773742676


training:  72%|███████▏  | 3621/5000 [2:03:17<45:27,  1.98s/it]

training loss: 1.4869898557662964
training loss: 1.4901561737060547
training loss: 1.4743136167526245
training loss: 1.4811131954193115
training loss: 1.4910235404968262
training loss: 1.348970651626587


training:  73%|███████▎  | 3627/5000 [2:03:29<45:14,  1.98s/it]

training loss: 1.5603225231170654
training loss: 1.4516364336013794
training loss: 1.4034610986709595
training loss: 1.4705671072006226
training loss: 1.5198216438293457
training loss: 1.4160282611846924


training:  73%|███████▎  | 3633/5000 [2:03:41<45:01,  1.98s/it]

training loss: 1.563652753829956
training loss: 1.5161681175231934
training loss: 1.4646421670913696
training loss: 1.3520476818084717
training loss: 1.5108811855316162
training loss: 1.4128198623657227


training:  73%|███████▎  | 3639/5000 [2:03:53<44:48,  1.98s/it]

training loss: 1.7266323566436768
training loss: 1.3468760251998901
training loss: 1.4600824117660522
training loss: 1.4358575344085693
training loss: 1.577979564666748
training loss: 1.4504929780960083


training:  73%|███████▎  | 3645/5000 [2:04:05<44:35,  1.97s/it]

training loss: 1.4342092275619507
training loss: 1.4538965225219727
training loss: 1.4426491260528564
training loss: 1.362264633178711
training loss: 1.3243606090545654
training loss: 1.4884713888168335


training:  73%|███████▎  | 3651/5000 [2:04:16<44:23,  1.97s/it]

training loss: 1.476445198059082
training loss: 1.492756962776184
training loss: 1.4446675777435303
training loss: 1.569942831993103
training loss: 1.384537935256958
training loss: 1.4000437259674072


training:  73%|███████▎  | 3657/5000 [2:04:28<44:11,  1.97s/it]

training loss: 1.429822564125061
training loss: 1.4689385890960693
training loss: 1.466667652130127
training loss: 1.5788494348526
training loss: 1.6048365831375122
training loss: 1.5666625499725342


training:  73%|███████▎  | 3663/5000 [2:04:40<43:59,  1.97s/it]

training loss: 1.5008877515792847
training loss: 1.383614182472229
training loss: 1.5965304374694824
training loss: 1.6362943649291992
training loss: 1.462458610534668
training loss: 1.3602319955825806


training:  73%|███████▎  | 3669/5000 [2:04:52<43:47,  1.97s/it]

training loss: 1.672558069229126
training loss: 1.4801700115203857
training loss: 1.4704370498657227
training loss: 1.5561434030532837
training loss: 1.486531138420105
training loss: 1.3931949138641357


training:  74%|███████▎  | 3675/5000 [2:05:04<43:35,  1.97s/it]

training loss: 1.462656021118164
training loss: 1.4814343452453613
training loss: 1.4634263515472412
training loss: 1.469982385635376
training loss: 1.472985029220581
training loss: 1.4630789756774902


training:  74%|███████▎  | 3681/5000 [2:05:16<43:23,  1.97s/it]

training loss: 1.3707079887390137
training loss: 1.2791211605072021
training loss: 1.4242699146270752
training loss: 1.4105861186981201
training loss: 1.536062479019165
training loss: 1.4601898193359375


training:  74%|███████▎  | 3687/5000 [2:05:28<43:11,  1.97s/it]

training loss: 1.4643439054489136
training loss: 1.5246745347976685
training loss: 1.4575552940368652
training loss: 1.4442962408065796
training loss: 1.522883415222168
training loss: 1.5743457078933716


training:  74%|███████▍  | 3693/5000 [2:05:39<42:59,  1.97s/it]

training loss: 1.5087865591049194
training loss: 1.3836654424667358
training loss: 1.3828887939453125
training loss: 1.4312697649002075
training loss: 1.5456136465072632
training loss: 1.5267360210418701


training:  74%|███████▍  | 3699/5000 [2:05:51<42:48,  1.97s/it]

training loss: 1.3379918336868286
training loss: 1.467726469039917
training loss: 1.4881865978240967
validation loss: 1.5920506715774536
training loss: 1.5370090007781982
training loss: 1.4616434574127197
training loss: 1.4164493083953857


training:  74%|███████▍  | 3705/5000 [2:06:03<42:48,  1.98s/it]

training loss: 1.3681211471557617
training loss: 1.5670957565307617
training loss: 1.592870831489563
training loss: 1.4456177949905396
training loss: 1.2262206077575684
training loss: 1.4158622026443481


training:  74%|███████▍  | 3711/5000 [2:06:15<42:33,  1.98s/it]

training loss: 1.491370439529419
training loss: 1.6547279357910156
training loss: 1.3934223651885986
training loss: 1.459066390991211
training loss: 1.4058573246002197
training loss: 1.437619686126709


training:  74%|███████▍  | 3717/5000 [2:06:27<42:18,  1.98s/it]

training loss: 1.5009394884109497
training loss: 1.3700321912765503
training loss: 1.3563995361328125
training loss: 1.4026215076446533
training loss: 1.4578057527542114
training loss: 1.4686492681503296


training:  74%|███████▍  | 3723/5000 [2:06:39<42:04,  1.98s/it]

training loss: 1.4342293739318848
training loss: 1.3629406690597534
training loss: 1.3999735116958618
training loss: 1.4946355819702148
training loss: 1.3622393608093262
training loss: 1.5323045253753662


training:  75%|███████▍  | 3729/5000 [2:06:51<41:51,  1.98s/it]

training loss: 1.5197885036468506
training loss: 1.4880083799362183
training loss: 1.4043900966644287
training loss: 1.3754104375839233
training loss: 1.4707458019256592
training loss: 1.4970548152923584


training:  75%|███████▍  | 3735/5000 [2:07:02<41:39,  1.98s/it]

training loss: 1.3741439580917358
training loss: 1.4280550479888916
training loss: 1.4931256771087646
training loss: 1.406307339668274
training loss: 1.486627221107483
training loss: 1.3454481363296509


training:  75%|███████▍  | 3741/5000 [2:07:14<41:26,  1.98s/it]

training loss: 1.5112743377685547
training loss: 1.4656951427459717
training loss: 1.5100879669189453
training loss: 1.5032908916473389
training loss: 1.4571363925933838
training loss: 1.4831891059875488


training:  75%|███████▍  | 3747/5000 [2:07:26<41:14,  1.98s/it]

training loss: 1.5935535430908203
training loss: 1.5429551601409912
training loss: 1.4008190631866455
training loss: 1.3821215629577637
training loss: 1.286012887954712
training loss: 1.5287619829177856


training:  75%|███████▌  | 3753/5000 [2:07:38<41:02,  1.97s/it]

training loss: 1.417956829071045
training loss: 1.4478429555892944
training loss: 1.4412853717803955
training loss: 1.3565888404846191
training loss: 1.3954235315322876
training loss: 1.4519597291946411


training:  75%|███████▌  | 3759/5000 [2:07:50<40:50,  1.97s/it]

training loss: 1.6310864686965942
training loss: 1.618299961090088
training loss: 1.3952454328536987
training loss: 1.3958210945129395
training loss: 1.4539042711257935
training loss: 1.5951833724975586


training:  75%|███████▌  | 3765/5000 [2:08:02<40:38,  1.97s/it]

training loss: 1.5541777610778809
training loss: 1.5037813186645508
training loss: 1.4942649602890015
training loss: 1.534414291381836
training loss: 1.4771596193313599
training loss: 1.5363796949386597


training:  75%|███████▌  | 3771/5000 [2:08:14<40:26,  1.97s/it]

training loss: 1.5493223667144775
training loss: 1.4165111780166626
training loss: 1.5025683641433716
training loss: 1.4699572324752808
training loss: 1.472312092781067
training loss: 1.42252779006958


training:  76%|███████▌  | 3777/5000 [2:08:25<40:14,  1.97s/it]

training loss: 1.4135409593582153
training loss: 1.3614181280136108
training loss: 1.5166583061218262
training loss: 1.5541772842407227
training loss: 1.426018238067627
training loss: 1.3908815383911133


training:  76%|███████▌  | 3783/5000 [2:08:37<40:02,  1.97s/it]

training loss: 1.443932056427002
training loss: 1.4578584432601929
training loss: 1.3814303874969482
training loss: 1.5541818141937256
training loss: 1.4454066753387451
training loss: 1.5710231065750122


training:  76%|███████▌  | 3789/5000 [2:08:49<39:50,  1.97s/it]

training loss: 1.6224963665008545
training loss: 1.5245994329452515
training loss: 1.5788053274154663
training loss: 1.5450721979141235
training loss: 1.4872839450836182
training loss: 1.3843741416931152


training:  76%|███████▌  | 3795/5000 [2:09:01<39:38,  1.97s/it]

training loss: 1.3912973403930664
training loss: 1.3748290538787842
training loss: 1.4792113304138184
training loss: 1.6189521551132202
training loss: 1.3880048990249634
training loss: 1.2768253087997437
training loss: 1.4008307456970215


training:  76%|███████▌  | 3801/5000 [2:09:13<39:37,  1.98s/it]

validation loss: 1.2504065036773682
training loss: 1.4669313430786133
training loss: 1.495794653892517
training loss: 1.4424242973327637
training loss: 1.7224366664886475
training loss: 1.52132248878479


training:  76%|███████▌  | 3807/5000 [2:09:25<39:22,  1.98s/it]

training loss: 1.5524228811264038
training loss: 1.2309728860855103
training loss: 1.4385287761688232
training loss: 1.3562248945236206
training loss: 1.4972740411758423
training loss: 1.3950880765914917


training:  76%|███████▋  | 3813/5000 [2:09:37<39:08,  1.98s/it]

training loss: 1.5296207666397095
training loss: 1.4542149305343628
training loss: 1.3319227695465088
training loss: 1.4054244756698608
training loss: 1.3814817667007446
training loss: 1.4316166639328003


training:  76%|███████▋  | 3819/5000 [2:09:48<38:55,  1.98s/it]

training loss: 1.432353138923645
training loss: 1.4854249954223633
training loss: 1.4629815816879272
training loss: 1.480320930480957
training loss: 1.4785325527191162
training loss: 1.444850206375122


training:  76%|███████▋  | 3825/5000 [2:10:00<38:42,  1.98s/it]

training loss: 1.3903924226760864
training loss: 1.3687905073165894
training loss: 1.373737096786499
training loss: 1.3786826133728027
training loss: 1.431218147277832
training loss: 1.535131812095642


training:  77%|███████▋  | 3831/5000 [2:10:12<38:29,  1.98s/it]

training loss: 1.5761233568191528
training loss: 1.3523716926574707
training loss: 1.5632390975952148
training loss: 1.521377444267273
training loss: 1.532457709312439
training loss: 1.4881154298782349


training:  77%|███████▋  | 3837/5000 [2:10:24<38:16,  1.97s/it]

training loss: 1.1815388202667236
training loss: 1.4296315908432007
training loss: 1.482131004333496
training loss: 1.6435645818710327
training loss: 1.4924944639205933
training loss: 1.3590980768203735


training:  77%|███████▋  | 3843/5000 [2:10:36<38:04,  1.97s/it]

training loss: 1.4501138925552368
training loss: 1.439568281173706
training loss: 1.46117103099823
training loss: 1.4276074171066284
training loss: 1.3812053203582764
training loss: 1.476364254951477


training:  77%|███████▋  | 3849/5000 [2:10:48<37:52,  1.97s/it]

training loss: 1.5640119314193726
training loss: 1.5677037239074707
training loss: 1.6190195083618164
training loss: 1.5419154167175293
training loss: 1.5530763864517212
training loss: 1.4959254264831543


training:  77%|███████▋  | 3855/5000 [2:11:00<37:40,  1.97s/it]

training loss: 1.372979760169983
training loss: 1.401291012763977
training loss: 1.4826874732971191
training loss: 1.5037035942077637
training loss: 1.4733933210372925
training loss: 1.5147418975830078


training:  77%|███████▋  | 3861/5000 [2:11:11<37:28,  1.97s/it]

training loss: 1.4387054443359375
training loss: 1.458652377128601
training loss: 1.3877671957015991
training loss: 1.3556982278823853
training loss: 1.4721829891204834
training loss: 1.4498932361602783


training:  77%|███████▋  | 3867/5000 [2:11:23<37:16,  1.97s/it]

training loss: 1.4636883735656738
training loss: 1.441058874130249
training loss: 1.443462610244751
training loss: 1.5260627269744873
training loss: 1.4956399202346802
training loss: 1.5704442262649536


training:  77%|███████▋  | 3873/5000 [2:11:35<37:04,  1.97s/it]

training loss: 1.384709119796753
training loss: 1.4897487163543701
training loss: 1.4335358142852783
training loss: 1.4701215028762817
training loss: 1.3782272338867188
training loss: 1.4082738161087036


training:  78%|███████▊  | 3879/5000 [2:11:47<36:53,  1.97s/it]

training loss: 1.4564961194992065
training loss: 1.3239834308624268
training loss: 1.5510249137878418
training loss: 1.3862301111221313
training loss: 1.506940484046936
training loss: 1.4364272356033325


training:  78%|███████▊  | 3885/5000 [2:11:59<36:41,  1.97s/it]

training loss: 1.4088537693023682
training loss: 1.4464861154556274
training loss: 1.5764402151107788
training loss: 1.3965320587158203
training loss: 1.4511080980300903
training loss: 1.3903862237930298


training:  78%|███████▊  | 3891/5000 [2:12:11<36:29,  1.97s/it]

training loss: 1.552010416984558
training loss: 1.4420844316482544
training loss: 1.4960222244262695
training loss: 1.4442808628082275
training loss: 1.5482678413391113
training loss: 1.4805620908737183


training:  78%|███████▊  | 3897/5000 [2:12:22<36:17,  1.97s/it]

training loss: 1.5164958238601685
training loss: 1.4221680164337158
training loss: 1.4503639936447144
training loss: 1.582817792892456
training loss: 1.4305610656738281
validation loss: 1.2684201002120972
training loss: 1.729813814163208


training:  78%|███████▊  | 3903/5000 [2:12:34<36:16,  1.98s/it]

training loss: 1.4014582633972168
training loss: 1.469220519065857
training loss: 1.4411548376083374
training loss: 1.380570650100708
training loss: 1.5356943607330322
training loss: 1.4988666772842407


training:  78%|███████▊  | 3909/5000 [2:12:46<36:00,  1.98s/it]

training loss: 1.3813880681991577
training loss: 1.4294720888137817
training loss: 1.5261610746383667
training loss: 1.3822855949401855
training loss: 1.2939468622207642
training loss: 1.4924061298370361


training:  78%|███████▊  | 3915/5000 [2:12:58<35:46,  1.98s/it]

training loss: 1.37863290309906
training loss: 1.4599485397338867
training loss: 1.4397343397140503
training loss: 1.4587651491165161
training loss: 1.4200814962387085
training loss: 1.6063090562820435


training:  78%|███████▊  | 3921/5000 [2:13:10<35:33,  1.98s/it]

training loss: 1.4509979486465454
training loss: 1.4699827432632446
training loss: 1.4046225547790527
training loss: 1.3152114152908325
training loss: 1.5070630311965942
training loss: 1.4353270530700684


training:  79%|███████▊  | 3927/5000 [2:13:22<35:20,  1.98s/it]

training loss: 1.3723646402359009
training loss: 1.4705511331558228
training loss: 1.3638825416564941
training loss: 1.4093691110610962
training loss: 1.5388621091842651
training loss: 1.4626935720443726


training:  79%|███████▊  | 3933/5000 [2:13:34<35:07,  1.98s/it]

training loss: 1.4786221981048584
training loss: 1.4268083572387695
training loss: 1.479310154914856
training loss: 1.461024284362793
training loss: 1.5265353918075562
training loss: 1.4641648530960083


training:  79%|███████▉  | 3939/5000 [2:13:46<34:55,  1.98s/it]

training loss: 1.435745120048523
training loss: 1.6903964281082153
training loss: 1.526933193206787
training loss: 1.3991458415985107
training loss: 1.3618232011795044
training loss: 1.4796652793884277


training:  79%|███████▉  | 3945/5000 [2:13:57<34:43,  1.97s/it]

training loss: 1.3363643884658813
training loss: 1.54012930393219
training loss: 1.4102429151535034
training loss: 1.481019377708435
training loss: 1.3487516641616821
training loss: 1.3997241258621216


training:  79%|███████▉  | 3951/5000 [2:14:09<34:31,  1.97s/it]

training loss: 1.4326975345611572
training loss: 1.4704385995864868
training loss: 1.4895936250686646
training loss: 1.4134408235549927
training loss: 1.5887659788131714
training loss: 1.5011968612670898


training:  79%|███████▉  | 3957/5000 [2:14:21<34:19,  1.97s/it]

training loss: 1.3957453966140747
training loss: 1.388611912727356
training loss: 1.4007092714309692
training loss: 1.4038535356521606
training loss: 1.3677257299423218
training loss: 1.3908330202102661


training:  79%|███████▉  | 3963/5000 [2:14:33<34:07,  1.97s/it]

training loss: 1.4341787099838257
training loss: 1.5569332838058472
training loss: 1.4942935705184937
training loss: 1.4888726472854614
training loss: 1.5793966054916382
training loss: 1.3832112550735474


training:  79%|███████▉  | 3969/5000 [2:14:45<33:55,  1.97s/it]

training loss: 1.4132126569747925
training loss: 1.4363560676574707
training loss: 1.2860950231552124
training loss: 1.5331720113754272
training loss: 1.3596187829971313
training loss: 1.4379401206970215


training:  80%|███████▉  | 3975/5000 [2:14:57<33:43,  1.97s/it]

training loss: 1.4819217920303345
training loss: 1.4782148599624634
training loss: 1.3863420486450195
training loss: 1.5683335065841675
training loss: 1.4217596054077148
training loss: 1.4563430547714233


training:  80%|███████▉  | 3981/5000 [2:15:08<33:31,  1.97s/it]

training loss: 1.314479947090149
training loss: 1.379249930381775
training loss: 1.3594098091125488
training loss: 1.3621701002120972
training loss: 1.437867522239685
training loss: 1.4984809160232544


training:  80%|███████▉  | 3987/5000 [2:15:20<33:19,  1.97s/it]

training loss: 1.262842059135437
training loss: 1.4263116121292114
training loss: 1.5849573612213135
training loss: 1.4972983598709106
training loss: 1.5367661714553833
training loss: 1.504228949546814


training:  80%|███████▉  | 3993/5000 [2:15:32<33:07,  1.97s/it]

training loss: 1.4747517108917236
training loss: 1.4195252656936646
training loss: 1.4309979677200317
training loss: 1.5629750490188599
training loss: 1.4877835512161255
training loss: 1.560010552406311


training:  80%|███████▉  | 3999/5000 [2:15:44<32:55,  1.97s/it]

training loss: 1.3981144428253174
training loss: 1.434308409690857
training loss: 1.4707331657409668
validation loss: 1.4143246412277222
%s 

 %s ("icans]], but they are now thought to have arrived in the Americas entirely separately from other indigenous Americans, long after the disappearance of the [[Bering land bridge]]. Accordingly, in Canada the Inuit do not consider themselves and are not usually considered by others as one of the [[First Nations]]. However, they, the Native Americans, and the [[MÃ©tis people (Canada)|MÃ©tis]] are collectively recognized by the Canadian [[Constitution Act, 1982|constitution]] as [[Aboriginal peoples in Canada]].  Other synonyms include &quot;First Peoples&quot; and &quot;Native Peoples&quot;.  ==Eskimo== ''See main article for more information on the term: [[Eskimo]]''  In [[Inuktitut]], the language of the Inuit people, &quot;Inuit&quot; means &quot;the people&quot;.  The [[English language|English]] word &quot;Eskimo&quot; is a Native American

training:  80%|████████  | 4001/5000 [2:16:18<1:04:31,  3.87s/it]

me]]'s pluration a straple, lord &quot;narrament).  He are correst ultion internal [[philoise]] &quot;Ill &quot;f shrine to rosenata to typroit phensions.&quot;. Dutchroally ice unline t. &quot;''Ten on twar chine at to the paint enemistrally adversation whio of hift if wishn pinofs.  The longue it also geometry shower, anly in twork's had hole the nall term (the kers's [[rephator]] for ugenerators aillings as acture, the all espown it lown ion supprouble.  == Muchtrefiour-divance ==  The vibacks action cle
training loss: 1.662380337715149
training loss: 1.517372965812683
training loss: 1.7049604654312134
training loss: 1.5460773706436157
training loss: 1.4672021865844727


training:  80%|████████  | 4007/5000 [2:16:30<53:09,  3.21s/it]  

training loss: 1.5821431875228882
training loss: 1.614979863166809
training loss: 1.442821979522705
training loss: 1.4282430410385132
training loss: 1.4651554822921753
training loss: 1.5019534826278687


training:  80%|████████  | 4013/5000 [2:16:42<46:03,  2.80s/it]

training loss: 1.5396085977554321
training loss: 1.5056394338607788
training loss: 1.4402130842208862
training loss: 1.4356329441070557
training loss: 1.3410907983779907
training loss: 1.478007435798645


training:  80%|████████  | 4019/5000 [2:16:54<41:25,  2.53s/it]

training loss: 1.5185461044311523
training loss: 1.569275140762329
training loss: 1.4599778652191162
training loss: 1.454969882965088
training loss: 1.4136008024215698
training loss: 1.4668185710906982


training:  80%|████████  | 4025/5000 [2:17:06<38:18,  2.36s/it]

training loss: 1.5388221740722656
training loss: 1.4371281862258911
training loss: 1.5771664381027222
training loss: 1.5146260261535645
training loss: 1.4620060920715332
training loss: 1.3974496126174927


training:  81%|████████  | 4031/5000 [2:17:18<36:08,  2.24s/it]

training loss: 1.4175692796707153
training loss: 1.4360952377319336
training loss: 1.5624586343765259
training loss: 1.3890239000320435
training loss: 1.4173822402954102
training loss: 1.5537070035934448


training:  81%|████████  | 4037/5000 [2:17:29<34:37,  2.16s/it]

training loss: 1.4836736917495728
training loss: 1.5503621101379395
training loss: 1.452593445777893
training loss: 1.3087692260742188
training loss: 1.5337517261505127
training loss: 1.48470139503479


training:  81%|████████  | 4043/5000 [2:17:41<33:30,  2.10s/it]

training loss: 1.3712152242660522
training loss: 1.4338239431381226
training loss: 1.4664181470870972
training loss: 1.4782482385635376
training loss: 1.38520348072052
training loss: 1.4661729335784912


training:  81%|████████  | 4049/5000 [2:17:53<32:41,  2.06s/it]

training loss: 1.3707259893417358
training loss: 1.4528268575668335
training loss: 1.5883911848068237
training loss: 1.4874794483184814
training loss: 1.5158169269561768
training loss: 1.438820719718933


training:  81%|████████  | 4055/5000 [2:18:05<32:03,  2.04s/it]

training loss: 1.4561673402786255
training loss: 1.2999579906463623
training loss: 1.6012042760849
training loss: 1.5269453525543213
training loss: 1.5441244840621948
training loss: 1.5010111331939697


training:  81%|████████  | 4061/5000 [2:18:17<31:34,  2.02s/it]

training loss: 1.374035120010376
training loss: 1.4078788757324219
training loss: 1.4665595293045044
training loss: 1.4311143159866333
training loss: 1.5023099184036255
training loss: 1.5956023931503296


training:  81%|████████▏ | 4067/5000 [2:18:29<31:09,  2.00s/it]

training loss: 1.569864273071289
training loss: 1.4850594997406006
training loss: 1.6340667009353638
training loss: 1.553450107574463
training loss: 1.3884509801864624
training loss: 1.5778082609176636


training:  81%|████████▏ | 4073/5000 [2:18:40<30:49,  1.99s/it]

training loss: 1.3484591245651245
training loss: 1.509429693222046
training loss: 1.4501795768737793
training loss: 1.5211656093597412
training loss: 1.3685187101364136
training loss: 1.6560349464416504


training:  82%|████████▏ | 4079/5000 [2:18:52<30:31,  1.99s/it]

training loss: 1.4059782028198242
training loss: 1.4094191789627075
training loss: 1.4792518615722656
training loss: 1.5119794607162476
training loss: 1.5284407138824463
training loss: 1.3465203046798706


training:  82%|████████▏ | 4085/5000 [2:19:04<30:15,  1.98s/it]

training loss: 1.4458470344543457
training loss: 1.443784236907959
training loss: 1.4093021154403687
training loss: 1.4596290588378906
training loss: 1.3941892385482788
training loss: 1.4453986883163452


training:  82%|████████▏ | 4091/5000 [2:19:16<30:00,  1.98s/it]

training loss: 1.407106637954712
training loss: 1.3523139953613281
training loss: 1.5086901187896729
training loss: 1.505316138267517
training loss: 1.4804697036743164
training loss: 1.425592303276062


training:  82%|████████▏ | 4097/5000 [2:19:28<29:46,  1.98s/it]

training loss: 1.3961809873580933
training loss: 1.4636614322662354
training loss: 1.5148423910140991
training loss: 1.3204859495162964
training loss: 1.5235410928726196
validation loss: 1.437227487564087
training loss: 1.5086889266967773


training:  82%|████████▏ | 4103/5000 [2:19:40<29:42,  1.99s/it]

training loss: 1.5470702648162842
training loss: 1.4417484998703003
training loss: 1.476500391960144
training loss: 1.4321149587631226
training loss: 1.5790817737579346


training:  82%|████████▏ | 4103/5000 [2:19:50<29:42,  1.99s/it]

training loss: 1.5490130186080933


training:  82%|████████▏ | 4109/5000 [2:19:52<29:26,  1.98s/it]

training loss: 1.4691282510757446
training loss: 1.4508213996887207
training loss: 1.4809527397155762
training loss: 1.4907751083374023
training loss: 1.4463938474655151
training loss: 1.4836735725402832


training:  82%|████████▏ | 4115/5000 [2:20:04<29:12,  1.98s/it]

training loss: 1.4525243043899536
training loss: 1.5128906965255737
training loss: 1.548101782798767
training loss: 1.4543412923812866
training loss: 1.51102614402771
training loss: 1.483603596687317


training:  82%|████████▏ | 4121/5000 [2:20:15<28:59,  1.98s/it]

training loss: 1.5995044708251953
training loss: 1.4933371543884277
training loss: 1.532675862312317
training loss: 1.5984251499176025
training loss: 1.5551867485046387
training loss: 1.3466389179229736


training:  83%|████████▎ | 4127/5000 [2:20:27<28:45,  1.98s/it]

training loss: 1.4626107215881348
training loss: 1.5109453201293945
training loss: 1.5084598064422607
training loss: 1.4477595090866089
training loss: 1.29315984249115
training loss: 1.4974236488342285


training:  83%|████████▎ | 4133/5000 [2:20:39<28:33,  1.98s/it]

training loss: 1.533085584640503
training loss: 1.521097183227539
training loss: 1.4931966066360474
training loss: 1.4637506008148193
training loss: 1.350464105606079
training loss: 1.5111491680145264


training:  83%|████████▎ | 4139/5000 [2:20:51<28:20,  1.98s/it]

training loss: 1.491774320602417
training loss: 1.417336106300354
training loss: 1.4427988529205322
training loss: 1.4544578790664673
training loss: 1.4747601747512817
training loss: 1.4781041145324707


training:  83%|████████▎ | 4145/5000 [2:21:03<28:08,  1.98s/it]

training loss: 1.440338134765625
training loss: 1.4573955535888672
training loss: 1.5781341791152954
training loss: 1.4615997076034546
training loss: 1.5971447229385376
training loss: 1.407019853591919


training:  83%|████████▎ | 4151/5000 [2:21:15<27:56,  1.97s/it]

training loss: 1.269856333732605
training loss: 1.4741730690002441
training loss: 1.4473823308944702
training loss: 1.476834774017334
training loss: 1.4054107666015625
training loss: 1.554661512374878


training:  83%|████████▎ | 4157/5000 [2:21:26<27:44,  1.97s/it]

training loss: 1.4186608791351318
training loss: 1.8809616565704346
training loss: 1.4711366891860962
training loss: 1.4530813694000244
training loss: 1.5393908023834229
training loss: 1.4650810956954956


training:  83%|████████▎ | 4163/5000 [2:21:38<27:32,  1.97s/it]

training loss: 1.462003231048584
training loss: 1.4466769695281982
training loss: 1.5392630100250244
training loss: 1.332189679145813
training loss: 1.4472603797912598
training loss: 1.3357281684875488


training:  83%|████████▎ | 4169/5000 [2:21:50<27:20,  1.97s/it]

training loss: 1.5088404417037964
training loss: 1.453071117401123
training loss: 1.3655052185058594
training loss: 1.4830487966537476
training loss: 1.5364261865615845
training loss: 1.7174514532089233


training:  84%|████████▎ | 4175/5000 [2:22:02<27:08,  1.97s/it]

training loss: 1.6530355215072632
training loss: 1.4553407430648804
training loss: 1.4109779596328735
training loss: 1.6976991891860962
training loss: 1.4790894985198975
training loss: 1.5767254829406738


training:  84%|████████▎ | 4181/5000 [2:22:14<26:56,  1.97s/it]

training loss: 1.5234119892120361
training loss: 1.5475611686706543
training loss: 1.5146461725234985
training loss: 1.5547590255737305
training loss: 1.5317261219024658
training loss: 1.4500324726104736


training:  84%|████████▎ | 4187/5000 [2:22:26<26:44,  1.97s/it]

training loss: 1.4854941368103027
training loss: 1.6009503602981567
training loss: 1.500383973121643
training loss: 1.4404897689819336
training loss: 1.428536057472229
training loss: 1.382672667503357


training:  84%|████████▍ | 4193/5000 [2:22:37<26:32,  1.97s/it]

training loss: 1.4300237894058228
training loss: 1.3865509033203125
training loss: 1.5265305042266846
training loss: 1.5315380096435547
training loss: 1.5139579772949219
training loss: 1.461504578590393


training:  84%|████████▍ | 4199/5000 [2:22:49<26:20,  1.97s/it]

training loss: 1.5053212642669678
training loss: 1.4054925441741943
training loss: 1.3472429513931274
validation loss: 1.329798698425293
training loss: 1.504502296447754
training loss: 1.5386366844177246
training loss: 1.4142603874206543


training:  84%|████████▍ | 4205/5000 [2:23:01<26:16,  1.98s/it]

training loss: 1.497687578201294
training loss: 1.5525671243667603
training loss: 1.400707483291626
training loss: 1.4741864204406738
training loss: 1.5873236656188965
training loss: 1.269207239151001


training:  84%|████████▍ | 4211/5000 [2:23:13<26:02,  1.98s/it]

training loss: 1.4586107730865479
training loss: 1.4203789234161377
training loss: 1.4268813133239746
training loss: 1.4364469051361084
training loss: 1.2764619588851929
training loss: 1.5767326354980469


training:  84%|████████▍ | 4217/5000 [2:23:25<25:49,  1.98s/it]

training loss: 1.5091276168823242
training loss: 1.2263020277023315
training loss: 1.4539752006530762
training loss: 1.3365001678466797
training loss: 1.419350266456604
training loss: 1.279076337814331


training:  84%|████████▍ | 4223/5000 [2:23:37<25:36,  1.98s/it]

training loss: 1.5337361097335815
training loss: 1.6385860443115234
training loss: 1.4380760192871094
training loss: 1.4889178276062012
training loss: 1.512924313545227
training loss: 1.4085261821746826


training:  85%|████████▍ | 4229/5000 [2:23:49<25:23,  1.98s/it]

training loss: 1.5166559219360352
training loss: 1.61327064037323
training loss: 1.498271107673645
training loss: 1.4322471618652344
training loss: 1.427920937538147
training loss: 1.3443864583969116


training:  85%|████████▍ | 4235/5000 [2:24:01<25:11,  1.98s/it]

training loss: 1.493656873703003
training loss: 1.5131328105926514
training loss: 1.4483740329742432
training loss: 1.129097819328308
training loss: 1.4908504486083984
training loss: 1.4558497667312622


training:  85%|████████▍ | 4241/5000 [2:24:12<24:58,  1.97s/it]

training loss: 1.3369779586791992
training loss: 1.4902440309524536
training loss: 1.586359977722168
training loss: 1.4206126928329468
training loss: 1.5057580471038818
training loss: 1.3054019212722778


training:  85%|████████▍ | 4247/5000 [2:24:24<24:46,  1.97s/it]

training loss: 1.5216346979141235
training loss: 1.4567129611968994
training loss: 1.5072925090789795
training loss: 1.4686635732650757
training loss: 1.4242733716964722
training loss: 1.4800591468811035


training:  85%|████████▌ | 4253/5000 [2:24:36<24:35,  1.97s/it]

training loss: 1.6392664909362793
training loss: 1.4001697301864624
training loss: 1.3387479782104492
training loss: 1.4523727893829346
training loss: 1.3797941207885742
training loss: 1.396268367767334


training:  85%|████████▌ | 4259/5000 [2:24:48<24:23,  1.97s/it]

training loss: 1.541566252708435
training loss: 1.5744215250015259
training loss: 1.4946941137313843
training loss: 1.2946940660476685
training loss: 1.4320192337036133
training loss: 1.39127779006958


training:  85%|████████▌ | 4265/5000 [2:25:00<24:11,  1.97s/it]

training loss: 1.6157469749450684
training loss: 1.7223055362701416
training loss: 1.5303020477294922
training loss: 1.5468238592147827
training loss: 1.57293701171875
training loss: 1.4606263637542725


training:  85%|████████▌ | 4271/5000 [2:25:12<23:59,  1.97s/it]

training loss: 1.3452879190444946
training loss: 1.5457168817520142
training loss: 1.450343370437622
training loss: 1.6181727647781372
training loss: 1.1983674764633179
training loss: 1.442558765411377


training:  86%|████████▌ | 4277/5000 [2:25:23<23:47,  1.97s/it]

training loss: 1.5066072940826416
training loss: 1.4697834253311157
training loss: 1.442659854888916
training loss: 1.4115763902664185
training loss: 1.4078847169876099
training loss: 1.5217721462249756


training:  86%|████████▌ | 4283/5000 [2:25:35<23:35,  1.97s/it]

training loss: 1.534532904624939
training loss: 1.4062745571136475
training loss: 1.5518856048583984
training loss: 1.395244836807251
training loss: 1.2709472179412842
training loss: 1.4973578453063965


training:  86%|████████▌ | 4289/5000 [2:25:47<23:23,  1.97s/it]

training loss: 1.6193091869354248
training loss: 1.4552052021026611
training loss: 1.5172560214996338
training loss: 1.458598256111145
training loss: 1.4810043573379517
training loss: 1.3958454132080078


training:  86%|████████▌ | 4295/5000 [2:25:59<23:11,  1.97s/it]

training loss: 1.460799217224121
training loss: 1.4559522867202759
training loss: 1.2987271547317505
training loss: 1.6208906173706055
training loss: 1.4445717334747314
training loss: 1.5954902172088623


training:  86%|████████▌ | 4295/5000 [2:26:10<23:11,  1.97s/it]

training loss: 1.4982020854949951


training:  86%|████████▌ | 4301/5000 [2:26:11<23:06,  1.98s/it]

validation loss: 1.2977160215377808
training loss: 1.3349418640136719
training loss: 1.3650178909301758
training loss: 1.5116214752197266
training loss: 1.376953125
training loss: 1.555521845817566


training:  86%|████████▌ | 4307/5000 [2:26:23<22:52,  1.98s/it]

training loss: 1.3648344278335571
training loss: 1.5050469636917114
training loss: 1.4933784008026123
training loss: 1.5515549182891846
training loss: 1.4796888828277588
training loss: 1.4135401248931885


training:  86%|████████▋ | 4313/5000 [2:26:35<22:39,  1.98s/it]

training loss: 1.5046474933624268
training loss: 1.5245518684387207
training loss: 1.5458083152770996
training loss: 1.5498254299163818
training loss: 1.5160444974899292
training loss: 1.3217928409576416


training:  86%|████████▋ | 4319/5000 [2:26:47<22:26,  1.98s/it]

training loss: 1.4633030891418457
training loss: 1.5160601139068604
training loss: 1.6509534120559692
training loss: 1.450460433959961
training loss: 1.440590739250183
training loss: 1.5166646242141724


training:  86%|████████▋ | 4325/5000 [2:26:58<22:14,  1.98s/it]

training loss: 1.4741859436035156
training loss: 1.3998072147369385
training loss: 1.5853869915008545
training loss: 1.3955810070037842
training loss: 1.392516016960144
training loss: 1.512808084487915


training:  87%|████████▋ | 4331/5000 [2:27:10<22:01,  1.98s/it]

training loss: 1.5328869819641113
training loss: 1.3905422687530518
training loss: 1.5266412496566772
training loss: 1.4616841077804565
training loss: 1.4479403495788574
training loss: 1.49431574344635


training:  87%|████████▋ | 4337/5000 [2:27:22<21:49,  1.98s/it]

training loss: 1.4280753135681152
training loss: 1.4887036085128784
training loss: 1.5269248485565186
training loss: 1.4795293807983398
training loss: 1.443198561668396
training loss: 1.3417322635650635


training:  87%|████████▋ | 4343/5000 [2:27:34<21:37,  1.97s/it]

training loss: 1.4524731636047363
training loss: 1.4096403121948242
training loss: 1.3596892356872559
training loss: 1.4657690525054932
training loss: 1.4041961431503296
training loss: 1.6213723421096802


training:  87%|████████▋ | 4349/5000 [2:27:46<21:25,  1.97s/it]

training loss: 1.3949830532073975
training loss: 1.4164140224456787
training loss: 1.4326168298721313
training loss: 1.4219872951507568
training loss: 1.4309523105621338
training loss: 1.4947504997253418


training:  87%|████████▋ | 4355/5000 [2:27:58<21:13,  1.97s/it]

training loss: 1.5285375118255615
training loss: 1.436251163482666
training loss: 1.5446480512619019
training loss: 1.5111477375030518
training loss: 1.7948126792907715
training loss: 1.4455982446670532


training:  87%|████████▋ | 4361/5000 [2:28:09<21:01,  1.97s/it]

training loss: 1.3620729446411133
training loss: 1.6105256080627441
training loss: 1.5423667430877686
training loss: 1.3797426223754883
training loss: 1.5357195138931274
training loss: 1.5238467454910278


training:  87%|████████▋ | 4367/5000 [2:28:21<20:49,  1.97s/it]

training loss: 1.5437043905258179
training loss: 1.3899900913238525
training loss: 1.47600257396698
training loss: 1.5080657005310059
training loss: 1.463223934173584
training loss: 1.4603782892227173


training:  87%|████████▋ | 4373/5000 [2:28:33<20:37,  1.97s/it]

training loss: 1.4495244026184082
training loss: 1.517479419708252
training loss: 1.4729551076889038
training loss: 1.6767446994781494
training loss: 1.5313804149627686
training loss: 1.485360026359558


training:  88%|████████▊ | 4379/5000 [2:28:45<20:25,  1.97s/it]

training loss: 1.5012699365615845
training loss: 1.4537817239761353
training loss: 1.485176920890808
training loss: 1.4237594604492188
training loss: 1.5541629791259766
training loss: 1.3932735919952393


training:  88%|████████▊ | 4385/5000 [2:28:57<20:13,  1.97s/it]

training loss: 1.4707480669021606
training loss: 1.4702624082565308
training loss: 1.5922257900238037
training loss: 1.4073903560638428
training loss: 1.5916413068771362
training loss: 1.4975953102111816


training:  88%|████████▊ | 4391/5000 [2:29:09<20:01,  1.97s/it]

training loss: 1.583746314048767
training loss: 1.5050878524780273
training loss: 1.5048574209213257
training loss: 1.494619369506836
training loss: 1.364802360534668
training loss: 1.4937207698822021


training:  88%|████████▊ | 4397/5000 [2:29:21<19:50,  1.97s/it]

training loss: 1.3827064037322998
training loss: 1.4101824760437012
training loss: 1.420691967010498
training loss: 1.4675984382629395
training loss: 1.5947792530059814
validation loss: 1.312354564666748
training loss: 1.490606427192688


training:  88%|████████▊ | 4403/5000 [2:29:33<19:44,  1.98s/it]

training loss: 1.4458929300308228
training loss: 1.504108190536499
training loss: 1.5112228393554688
training loss: 1.4144911766052246
training loss: 1.4987260103225708
training loss: 1.4724000692367554


training:  88%|████████▊ | 4409/5000 [2:29:44<19:30,  1.98s/it]

training loss: 1.5006117820739746
training loss: 1.4034943580627441
training loss: 1.293717861175537
training loss: 1.4878385066986084
training loss: 1.4194469451904297
training loss: 1.3574966192245483


training:  88%|████████▊ | 4415/5000 [2:29:56<19:17,  1.98s/it]

training loss: 1.5867787599563599
training loss: 1.6049938201904297
training loss: 1.461084008216858
training loss: 1.3838260173797607
training loss: 1.4377036094665527
training loss: 1.5884933471679688


training:  88%|████████▊ | 4421/5000 [2:30:08<19:04,  1.98s/it]

training loss: 1.4451426267623901
training loss: 1.519092321395874
training loss: 1.4491584300994873
training loss: 1.5449026823043823
training loss: 1.4438530206680298
training loss: 1.5609509944915771


training:  89%|████████▊ | 4427/5000 [2:30:20<18:52,  1.98s/it]

training loss: 1.4918714761734009
training loss: 1.4276009798049927
training loss: 1.5348328351974487
training loss: 1.4166181087493896
training loss: 1.4264582395553589
training loss: 1.448201298713684


training:  89%|████████▊ | 4433/5000 [2:30:32<18:40,  1.98s/it]

training loss: 1.3992475271224976
training loss: 1.5237869024276733
training loss: 1.3257454633712769
training loss: 1.4401741027832031
training loss: 1.4691702127456665
training loss: 1.4728662967681885


training:  89%|████████▉ | 4439/5000 [2:30:44<18:28,  1.98s/it]

training loss: 1.4302140474319458
training loss: 1.4526029825210571
training loss: 1.7295010089874268
training loss: 1.4816967248916626
training loss: 1.3840925693511963
training loss: 1.469981074333191


training:  89%|████████▉ | 4445/5000 [2:30:55<18:15,  1.97s/it]

training loss: 1.509536862373352
training loss: 1.5517860651016235
training loss: 1.4864503145217896
training loss: 1.4684748649597168
training loss: 1.4976156949996948
training loss: 1.4642659425735474


training:  89%|████████▉ | 4451/5000 [2:31:07<18:03,  1.97s/it]

training loss: 1.5023695230484009
training loss: 1.3794814348220825
training loss: 1.6070035696029663
training loss: 1.4019159078598022
training loss: 1.4992930889129639
training loss: 1.456549048423767


training:  89%|████████▉ | 4457/5000 [2:31:19<17:52,  1.97s/it]

training loss: 1.4548827409744263
training loss: 1.57666015625
training loss: 1.361595869064331
training loss: 1.701364517211914
training loss: 1.5036967992782593
training loss: 1.4535876512527466


training:  89%|████████▉ | 4463/5000 [2:31:31<17:40,  1.97s/it]

training loss: 1.4092692136764526
training loss: 1.4343538284301758
training loss: 1.5645374059677124
training loss: 1.5404603481292725
training loss: 1.490583062171936
training loss: 1.4332102537155151


training:  89%|████████▉ | 4469/5000 [2:31:43<17:28,  1.97s/it]

training loss: 1.4967827796936035
training loss: 1.5271860361099243
training loss: 1.5242923498153687
training loss: 1.4106193780899048
training loss: 1.5611432790756226
training loss: 1.4058457612991333


training:  90%|████████▉ | 4475/5000 [2:31:55<17:16,  1.97s/it]

training loss: 1.5377572774887085
training loss: 1.5262761116027832
training loss: 1.4168339967727661
training loss: 1.503415822982788
training loss: 1.6343507766723633
training loss: 1.4126933813095093


training:  90%|████████▉ | 4481/5000 [2:32:07<17:04,  1.97s/it]

training loss: 1.5374834537506104
training loss: 1.3613831996917725
training loss: 1.4418418407440186
training loss: 1.4638831615447998
training loss: 1.3977488279342651
training loss: 1.3428438901901245


training:  90%|████████▉ | 4487/5000 [2:32:18<16:52,  1.97s/it]

training loss: 1.4545649290084839
training loss: 1.3675559759140015
training loss: 1.4387764930725098
training loss: 1.4993399381637573
training loss: 1.4075827598571777
training loss: 1.564963698387146


training:  90%|████████▉ | 4493/5000 [2:32:30<16:40,  1.97s/it]

training loss: 1.4370825290679932
training loss: 1.4542752504348755
training loss: 1.4194109439849854
training loss: 1.5411466360092163
training loss: 1.43401038646698
training loss: 1.3437303304672241


training:  90%|████████▉ | 4499/5000 [2:32:42<16:28,  1.97s/it]

training loss: 1.3661489486694336
training loss: 1.427465558052063
training loss: 1.4526394605636597
validation loss: 1.3646372556686401
%s 

 %s ('sh English|BE]]) is the [[mineral]] form of [[Iron (III) oxide]], (Fe&lt;sub&gt;2&lt;/sub&gt;O&lt;sub&gt;3&lt;/sub&gt;), one of several [[iron oxide]]s. The [[ore]] sometimes contains slight amounts of [[titanium]]. When shaped into ornaments, it is often called black diamond.  [[Image:Hematite.jpg|left|thumb|200px|Hematite (kidney ore) from Michigan]]  Hematite is a very common mineral, coloured black to steel or silver-gray, brown to reddish brown, or red. It is [[mining|mined]] as the main ore of iron. Varieties include Bloodstone, Iron Rose, Kidney Ore, Martite, Paint Ore, Specularite (Specular Hematite), Rainbow Hematite and Titano-hematite. While the forms of hematite vary, they all have a rust-red streak. Hematite is harder than pure iron, but much more brittle.  Deposits of grey hematite are typically found in places where there has

training:  90%|█████████ | 4501/5000 [2:33:16<32:13,  3.87s/it]

n on [[arm a Brean Bille]] in [[placiation]]. In thin the tof [[Al-Jabs]] of [[Kast monas]], [[Albhema Ta Historianism]], at [[Anearchient Inivo Powers]], [[Kniton theologens]]. Horse is reborred the spective retimes bright. His broad been productive or the core, the obest weactivo of my ''[[specity to Cher]]'', ''ctuals'' not &quot;[[ssometimes]], ''Americhto s arge others of the one turben&quot;sof. See [[British on Brizativities metril]]&quot;.  Achineerient age hut all with f more cannection, no, action
training loss: 1.3838876485824585
training loss: 1.3854376077651978
training loss: 1.5198793411254883
training loss: 1.4173556566238403
training loss: 1.5193036794662476


training:  90%|█████████ | 4507/5000 [2:33:28<26:23,  3.21s/it]

training loss: 1.464389681816101
training loss: 1.5431568622589111
training loss: 1.4189453125
training loss: 1.4564822912216187
training loss: 1.535617470741272
training loss: 1.3416498899459839


training:  90%|█████████ | 4513/5000 [2:33:40<22:43,  2.80s/it]

training loss: 1.5018988847732544
training loss: 1.4528971910476685
training loss: 1.3268253803253174
training loss: 1.502511739730835
training loss: 1.5297589302062988
training loss: 1.4625649452209473


training:  90%|█████████ | 4519/5000 [2:33:52<20:18,  2.53s/it]

training loss: 1.4502884149551392
training loss: 1.4860063791275024
training loss: 1.529703974723816
training loss: 1.4037063121795654
training loss: 1.4357054233551025
training loss: 1.5574203729629517


training:  90%|█████████ | 4525/5000 [2:34:04<18:39,  2.36s/it]

training loss: 1.4945446252822876
training loss: 1.449062466621399
training loss: 1.542846441268921
training loss: 1.4661900997161865
training loss: 1.3980194330215454
training loss: 1.3249255418777466


training:  91%|█████████ | 4531/5000 [2:34:16<17:29,  2.24s/it]

training loss: 1.4955545663833618
training loss: 1.5476628541946411
training loss: 1.527535080909729
training loss: 1.3631950616836548
training loss: 1.5820292234420776
training loss: 1.4789389371871948


training:  91%|█████████ | 4537/5000 [2:34:27<16:38,  2.16s/it]

training loss: 1.2918874025344849
training loss: 1.447456955909729
training loss: 1.4034894704818726
training loss: 1.4503296613693237
training loss: 1.4155802726745605
training loss: 1.5378751754760742


training:  91%|█████████ | 4543/5000 [2:34:39<16:00,  2.10s/it]

training loss: 1.4704512357711792
training loss: 1.485735297203064
training loss: 1.4458671808242798
training loss: 1.3874850273132324
training loss: 1.5859805345535278
training loss: 1.4093097448349


training:  91%|█████████ | 4549/5000 [2:34:51<15:30,  2.06s/it]

training loss: 1.5031251907348633
training loss: 1.4009021520614624
training loss: 1.4467498064041138
training loss: 1.3823853731155396
training loss: 1.4458327293395996
training loss: 1.3406949043273926


training:  91%|█████████ | 4555/5000 [2:35:03<15:05,  2.04s/it]

training loss: 1.4383964538574219
training loss: 1.4978437423706055
training loss: 1.4989606142044067
training loss: 1.611282467842102
training loss: 1.4577409029006958
training loss: 1.3953267335891724


training:  91%|█████████ | 4561/5000 [2:35:15<14:45,  2.02s/it]

training loss: 1.0878021717071533
training loss: 1.4258674383163452
training loss: 1.4463856220245361
training loss: 1.5417066812515259
training loss: 1.5659809112548828
training loss: 1.4848111867904663


training:  91%|█████████▏| 4567/5000 [2:35:27<14:27,  2.00s/it]

training loss: 1.4940186738967896
training loss: 1.3926416635513306
training loss: 1.4233732223510742
training loss: 1.3603519201278687
training loss: 1.5475091934204102
training loss: 1.4334739446640015


training:  91%|█████████▏| 4573/5000 [2:35:39<14:11,  2.00s/it]

training loss: 1.4686613082885742
training loss: 1.6064952611923218
training loss: 1.4722143411636353
training loss: 1.4987822771072388
training loss: 1.455386757850647
training loss: 1.5311622619628906


training:  92%|█████████▏| 4579/5000 [2:35:50<13:57,  1.99s/it]

training loss: 1.562971591949463
training loss: 1.3586503267288208
training loss: 1.4807347059249878
training loss: 1.4159356355667114
training loss: 1.43317711353302
training loss: 1.4490846395492554


training:  92%|█████████▏| 4585/5000 [2:36:02<13:43,  1.98s/it]

training loss: 1.4204120635986328
training loss: 1.5492669343948364
training loss: 1.4283231496810913
training loss: 1.4888495206832886
training loss: 1.4403679370880127
training loss: 1.5059926509857178


training:  92%|█████████▏| 4591/5000 [2:36:14<13:30,  1.98s/it]

training loss: 1.497625470161438
training loss: 1.453489065170288
training loss: 1.4876028299331665
training loss: 1.5111808776855469
training loss: 1.5011370182037354
training loss: 1.4517408609390259


training:  92%|█████████▏| 4597/5000 [2:36:26<13:17,  1.98s/it]

training loss: 1.407101035118103
training loss: 1.4524909257888794
training loss: 1.4783501625061035
training loss: 1.5027345418930054
training loss: 1.357904314994812
validation loss: 1.2475956678390503
training loss: 1.3602615594863892


training:  92%|█████████▏| 4603/5000 [2:36:38<13:08,  1.99s/it]

training loss: 1.5116583108901978
training loss: 1.4431347846984863
training loss: 1.550965428352356
training loss: 1.4212226867675781
training loss: 1.461991786956787
training loss: 1.4172673225402832


training:  92%|█████████▏| 4609/5000 [2:36:50<12:55,  1.98s/it]

training loss: 1.4046459197998047
training loss: 1.4026459455490112
training loss: 1.1320898532867432
training loss: 1.3995275497436523
training loss: 1.515219807624817
training loss: 1.5811878442764282


training:  92%|█████████▏| 4615/5000 [2:37:02<12:42,  1.98s/it]

training loss: 1.335895299911499
training loss: 1.6214289665222168
training loss: 1.4768747091293335
training loss: 1.558017611503601
training loss: 1.534522294998169
training loss: 1.3692467212677002


training:  92%|█████████▏| 4621/5000 [2:37:13<12:29,  1.98s/it]

training loss: 1.2072393894195557
training loss: 1.4305145740509033
training loss: 1.4303030967712402
training loss: 1.6988662481307983
training loss: 1.481350064277649
training loss: 1.60670006275177


training:  93%|█████████▎| 4627/5000 [2:37:25<12:17,  1.98s/it]

training loss: 1.5333846807479858
training loss: 1.3766487836837769
training loss: 1.4803386926651
training loss: 1.4752044677734375
training loss: 1.3850067853927612
training loss: 1.5481464862823486


training:  93%|█████████▎| 4633/5000 [2:37:37<12:05,  1.98s/it]

training loss: 1.4917504787445068
training loss: 1.2951775789260864
training loss: 1.3848427534103394
training loss: 1.381386160850525
training loss: 1.4459820985794067
training loss: 1.639127492904663


training:  93%|█████████▎| 4639/5000 [2:37:49<11:53,  1.98s/it]

training loss: 1.4078636169433594
training loss: 1.4159517288208008
training loss: 1.4650225639343262
training loss: 1.4605299234390259
training loss: 1.4599366188049316
training loss: 1.6767230033874512


training:  93%|█████████▎| 4645/5000 [2:38:01<11:41,  1.97s/it]

training loss: 1.419786810874939
training loss: 1.579967737197876
training loss: 1.4613614082336426
training loss: 1.4682456254959106
training loss: 1.5661725997924805
training loss: 1.5649691820144653


training:  93%|█████████▎| 4651/5000 [2:38:13<11:29,  1.97s/it]

training loss: 1.4541754722595215
training loss: 1.4625688791275024
training loss: 1.4654037952423096
training loss: 1.190253734588623
training loss: 1.4100826978683472
training loss: 1.42668616771698


training:  93%|█████████▎| 4657/5000 [2:38:25<11:17,  1.97s/it]

training loss: 1.4964112043380737
training loss: 1.5205104351043701
training loss: 1.427830457687378
training loss: 1.5742658376693726
training loss: 1.3884665966033936
training loss: 1.4120471477508545


training:  93%|█████████▎| 4663/5000 [2:38:36<11:05,  1.97s/it]

training loss: 1.4782776832580566
training loss: 1.4492048025131226
training loss: 1.6091465950012207
training loss: 1.369686484336853
training loss: 1.3481041193008423
training loss: 1.34890878200531


training:  93%|█████████▎| 4669/5000 [2:38:48<10:53,  1.97s/it]

training loss: 1.339659333229065
training loss: 1.508461356163025
training loss: 1.2724436521530151
training loss: 1.537136435508728
training loss: 1.2546340227127075
training loss: 1.4848567247390747


training:  94%|█████████▎| 4675/5000 [2:39:00<10:41,  1.97s/it]

training loss: 1.2858983278274536
training loss: 1.536634087562561
training loss: 1.4035048484802246
training loss: 1.56515371799469
training loss: 1.5265374183654785
training loss: 1.3985660076141357


training:  94%|█████████▎| 4681/5000 [2:39:12<10:29,  1.97s/it]

training loss: 1.2833726406097412
training loss: 1.4819518327713013
training loss: 1.3864225149154663
training loss: 1.3634036779403687
training loss: 1.4580892324447632
training loss: 1.5117709636688232


training:  94%|█████████▎| 4687/5000 [2:39:24<10:17,  1.97s/it]

training loss: 1.4613813161849976
training loss: 1.4186339378356934
training loss: 1.6068403720855713
training loss: 1.4561461210250854
training loss: 1.4942119121551514
training loss: 1.497085452079773


training:  94%|█████████▍| 4693/5000 [2:39:36<10:05,  1.97s/it]

training loss: 1.4919538497924805
training loss: 1.478933334350586
training loss: 1.4061002731323242
training loss: 1.4663058519363403
training loss: 1.5043668746948242
training loss: 1.4748061895370483


training:  94%|█████████▍| 4699/5000 [2:39:47<09:54,  1.97s/it]

training loss: 1.511594295501709
training loss: 1.4856562614440918
training loss: 1.4609968662261963
validation loss: 1.3198028802871704
training loss: 1.5996915102005005
training loss: 1.4364699125289917
training loss: 1.4181087017059326


training:  94%|█████████▍| 4705/5000 [2:39:59<09:45,  1.98s/it]

training loss: 1.4082486629486084
training loss: 1.4771090745925903
training loss: 1.4269975423812866
training loss: 1.4387900829315186
training loss: 1.498857021331787
training loss: 1.4038138389587402


training:  94%|█████████▍| 4711/5000 [2:40:11<09:32,  1.98s/it]

training loss: 1.5090751647949219
training loss: 1.4329326152801514
training loss: 1.7069052457809448
training loss: 1.5153228044509888
training loss: 1.5633037090301514
training loss: 1.4656330347061157


training:  94%|█████████▍| 4717/5000 [2:40:23<09:19,  1.98s/it]

training loss: 1.2375538349151611
training loss: 1.5075602531433105
training loss: 1.474940538406372
training loss: 1.437920093536377
training loss: 1.4290105104446411
training loss: 1.5103936195373535


training:  94%|█████████▍| 4723/5000 [2:40:35<09:07,  1.98s/it]

training loss: 1.6869275569915771
training loss: 1.438848614692688
training loss: 1.6078836917877197
training loss: 1.501869797706604
training loss: 1.3263802528381348
training loss: 1.4234411716461182


training:  95%|█████████▍| 4729/5000 [2:40:47<08:55,  1.98s/it]

training loss: 1.5192880630493164
training loss: 1.4504032135009766
training loss: 1.4488859176635742
training loss: 1.4547901153564453
training loss: 1.3595879077911377
training loss: 1.5056825876235962


training:  95%|█████████▍| 4735/5000 [2:40:59<08:43,  1.98s/it]

training loss: 1.5833364725112915
training loss: 1.542734980583191
training loss: 1.4390082359313965
training loss: 1.4701564311981201
training loss: 1.4364280700683594
training loss: 1.5791468620300293


training:  95%|█████████▍| 4741/5000 [2:41:11<08:31,  1.98s/it]

training loss: 1.4213330745697021
training loss: 1.4820570945739746
training loss: 1.3460553884506226
training loss: 1.443732738494873
training loss: 1.4576797485351562
training loss: 1.4438410997390747


training:  95%|█████████▍| 4747/5000 [2:41:22<08:19,  1.97s/it]

training loss: 1.4737937450408936
training loss: 1.487216830253601
training loss: 1.4611830711364746
training loss: 1.4107691049575806
training loss: 1.2717885971069336
training loss: 1.3657368421554565


training:  95%|█████████▌| 4753/5000 [2:41:34<08:07,  1.97s/it]

training loss: 1.3619437217712402
training loss: 1.530654788017273
training loss: 1.3942463397979736
training loss: 1.4416710138320923
training loss: 1.4733220338821411
training loss: 1.50193190574646


training:  95%|█████████▌| 4759/5000 [2:41:46<07:55,  1.97s/it]

training loss: 1.5438381433486938
training loss: 1.5216261148452759
training loss: 1.5703374147415161
training loss: 1.4368376731872559
training loss: 1.5278284549713135
training loss: 1.4955573081970215


training:  95%|█████████▌| 4765/5000 [2:41:58<07:43,  1.97s/it]

training loss: 1.4796180725097656
training loss: 1.466071367263794
training loss: 1.515883207321167
training loss: 1.5339195728302002
training loss: 1.3684149980545044
training loss: 1.499359130859375


training:  95%|█████████▌| 4771/5000 [2:42:10<07:32,  1.97s/it]

training loss: 1.3898484706878662
training loss: 1.6472761631011963
training loss: 1.4995641708374023
training loss: 1.4673267602920532
training loss: 1.3923449516296387
training loss: 1.4161405563354492


training:  96%|█████████▌| 4777/5000 [2:42:22<07:20,  1.97s/it]

training loss: 1.56053626537323
training loss: 1.459165334701538
training loss: 1.4556090831756592
training loss: 1.4491569995880127
training loss: 1.4192616939544678
training loss: 1.4764275550842285


training:  96%|█████████▌| 4783/5000 [2:42:33<07:08,  1.97s/it]

training loss: 1.610140085220337
training loss: 1.597596287727356
training loss: 1.5708681344985962
training loss: 1.5332911014556885
training loss: 1.379928708076477
training loss: 1.432091236114502


training:  96%|█████████▌| 4789/5000 [2:42:45<06:56,  1.97s/it]

training loss: 1.564041018486023
training loss: 1.3867186307907104
training loss: 1.343666434288025
training loss: 1.4555206298828125
training loss: 1.4284539222717285
training loss: 1.379038691520691


training:  96%|█████████▌| 4795/5000 [2:42:57<06:44,  1.97s/it]

training loss: 1.4751477241516113
training loss: 1.4780492782592773
training loss: 1.3940316438674927
training loss: 1.439241647720337
training loss: 1.5476711988449097
training loss: 1.7094625234603882
training loss: 1.4016515016555786


training:  96%|█████████▌| 4801/5000 [2:43:09<06:34,  1.98s/it]

validation loss: 1.3967769145965576
training loss: 1.486617922782898
training loss: 1.1993640661239624
training loss: 1.465087652206421
training loss: 1.4299252033233643
training loss: 1.495526671409607


training:  96%|█████████▌| 4807/5000 [2:43:21<06:22,  1.98s/it]

training loss: 1.4777884483337402
training loss: 1.5949585437774658
training loss: 1.388669729232788
training loss: 1.548795461654663
training loss: 1.4671262502670288
training loss: 1.5048964023590088


training:  96%|█████████▋| 4813/5000 [2:43:33<06:10,  1.98s/it]

training loss: 1.4966347217559814
training loss: 1.4286872148513794
training loss: 1.4133784770965576
training loss: 1.5013610124588013
training loss: 1.4752259254455566
training loss: 1.349871039390564


training:  96%|█████████▋| 4819/5000 [2:43:45<05:57,  1.98s/it]

training loss: 1.4017601013183594
training loss: 1.507892370223999
training loss: 1.421134114265442
training loss: 1.5855534076690674
training loss: 1.3998832702636719
training loss: 1.4147181510925293


training:  96%|█████████▋| 4825/5000 [2:43:57<05:45,  1.98s/it]

training loss: 1.2655048370361328
training loss: 1.5547378063201904
training loss: 1.4737927913665771
training loss: 1.4692524671554565
training loss: 1.4676706790924072
training loss: 1.49797785282135


training:  97%|█████████▋| 4831/5000 [2:44:08<05:33,  1.98s/it]

training loss: 1.4628266096115112
training loss: 1.5159006118774414
training loss: 1.3868381977081299
training loss: 1.4063900709152222
training loss: 1.4218833446502686
training loss: 1.3985532522201538


training:  97%|█████████▋| 4837/5000 [2:44:20<05:21,  1.98s/it]

training loss: 1.4507797956466675
training loss: 1.507901668548584
training loss: 1.6435809135437012
training loss: 1.4710733890533447
training loss: 1.5034327507019043
training loss: 1.6060278415679932


training:  97%|█████████▋| 4843/5000 [2:44:32<05:10,  1.97s/it]

training loss: 1.3743078708648682
training loss: 1.4772690534591675
training loss: 1.4260609149932861
training loss: 1.4779918193817139
training loss: 1.3929482698440552
training loss: 1.3555824756622314


training:  97%|█████████▋| 4849/5000 [2:44:44<04:58,  1.97s/it]

training loss: 1.4867268800735474
training loss: 1.4336493015289307
training loss: 1.4018694162368774
training loss: 1.5202300548553467
training loss: 1.5791692733764648
training loss: 1.4481725692749023


training:  97%|█████████▋| 4855/5000 [2:44:56<04:46,  1.97s/it]

training loss: 1.258795142173767
training loss: 1.448333978652954
training loss: 1.358061671257019
training loss: 1.6051771640777588
training loss: 1.6453821659088135
training loss: 1.4735151529312134


training:  97%|█████████▋| 4861/5000 [2:45:08<04:34,  1.97s/it]

training loss: 1.5218174457550049
training loss: 1.5784486532211304
training loss: 1.3795844316482544
training loss: 1.4914913177490234
training loss: 1.3869104385375977
training loss: 1.4223144054412842


training:  97%|█████████▋| 4867/5000 [2:45:19<04:22,  1.97s/it]

training loss: 1.6061151027679443
training loss: 1.5263047218322754
training loss: 1.4937751293182373
training loss: 1.2979495525360107
training loss: 1.5489474534988403
training loss: 1.502774953842163


training:  97%|█████████▋| 4873/5000 [2:45:31<04:10,  1.97s/it]

training loss: 1.4515318870544434
training loss: 1.5000262260437012
training loss: 1.4913444519042969
training loss: 1.3409316539764404
training loss: 1.5351675748825073
training loss: 1.5018203258514404


training:  98%|█████████▊| 4879/5000 [2:45:43<03:58,  1.97s/it]

training loss: 1.4619319438934326
training loss: 1.4568915367126465
training loss: 1.4171860218048096
training loss: 1.3557894229888916
training loss: 1.5315717458724976
training loss: 1.4885796308517456


training:  98%|█████████▊| 4885/5000 [2:45:55<03:47,  1.97s/it]

training loss: 1.4203927516937256
training loss: 1.4613611698150635
training loss: 1.5772342681884766
training loss: 1.551985502243042
training loss: 1.5691591501235962
training loss: 1.47029709815979


training:  98%|█████████▊| 4891/5000 [2:46:07<03:35,  1.97s/it]

training loss: 1.4057843685150146
training loss: 1.4979214668273926
training loss: 1.5780225992202759
training loss: 1.4923198223114014
training loss: 1.5412760972976685
training loss: 1.3854410648345947


training:  98%|█████████▊| 4897/5000 [2:46:19<03:23,  1.97s/it]

training loss: 1.5955028533935547
training loss: 1.419206142425537
training loss: 1.6468273401260376
training loss: 1.5476081371307373
training loss: 1.510854721069336
validation loss: 1.3978066444396973
training loss: 1.486504316329956


training:  98%|█████████▊| 4903/5000 [2:46:31<03:12,  1.98s/it]

training loss: 1.4496328830718994
training loss: 1.4498918056488037
training loss: 1.4722952842712402
training loss: 1.5321630239486694
training loss: 1.49064302444458
training loss: 1.4930135011672974


training:  98%|█████████▊| 4909/5000 [2:46:43<03:00,  1.98s/it]

training loss: 1.492522954940796
training loss: 1.5492277145385742
training loss: 1.4076606035232544
training loss: 1.535681962966919
training loss: 1.5094106197357178
training loss: 1.3664082288742065


training:  98%|█████████▊| 4915/5000 [2:46:54<02:48,  1.98s/it]

training loss: 1.4885876178741455
training loss: 1.503755807876587
training loss: 1.4443587064743042
training loss: 1.4213933944702148
training loss: 1.42287278175354
training loss: 1.4670863151550293


training:  98%|█████████▊| 4921/5000 [2:47:06<02:36,  1.98s/it]

training loss: 1.4891071319580078
training loss: 1.3337500095367432
training loss: 1.4817525148391724
training loss: 1.5243521928787231
training loss: 1.404289960861206
training loss: 1.485752820968628


training:  99%|█████████▊| 4927/5000 [2:47:18<02:24,  1.98s/it]

training loss: 1.5218144655227661
training loss: 1.5601340532302856
training loss: 1.559597373008728
training loss: 1.4139621257781982
training loss: 1.544506311416626
training loss: 1.558176040649414


training:  99%|█████████▊| 4933/5000 [2:47:30<02:12,  1.98s/it]

training loss: 1.4114058017730713
training loss: 1.5768523216247559
training loss: 1.4639008045196533
training loss: 1.512479543685913
training loss: 1.2605078220367432
training loss: 1.3454492092132568


training:  99%|█████████▉| 4939/5000 [2:47:42<02:00,  1.98s/it]

training loss: 1.4318310022354126
training loss: 1.5130900144577026
training loss: 1.4966392517089844
training loss: 1.5270451307296753
training loss: 1.3581624031066895
training loss: 1.448475956916809


training:  99%|█████████▉| 4945/5000 [2:47:54<01:48,  1.97s/it]

training loss: 1.510392665863037
training loss: 1.470781683921814
training loss: 1.5077279806137085
training loss: 1.474554181098938
training loss: 1.542959451675415
training loss: 1.4733893871307373


training:  99%|█████████▉| 4951/5000 [2:48:05<01:36,  1.97s/it]

training loss: 1.5735491514205933
training loss: 1.415040373802185
training loss: 1.5624905824661255
training loss: 1.4650808572769165
training loss: 1.3987629413604736
training loss: 1.5130079984664917


training:  99%|█████████▉| 4957/5000 [2:48:17<01:24,  1.97s/it]

training loss: 1.4563742876052856
training loss: 1.440799355506897
training loss: 1.5062962770462036
training loss: 1.4785228967666626
training loss: 1.3581552505493164
training loss: 1.5897022485733032


training:  99%|█████████▉| 4963/5000 [2:48:29<01:13,  1.97s/it]

training loss: 1.4334174394607544
training loss: 1.3790072202682495
training loss: 1.4629489183425903
training loss: 1.443174958229065
training loss: 1.4167670011520386
training loss: 1.5079967975616455


training:  99%|█████████▉| 4969/5000 [2:48:41<01:01,  1.97s/it]

training loss: 1.4156745672225952
training loss: 1.504702091217041
training loss: 1.4789315462112427
training loss: 1.4889461994171143
training loss: 1.52727472782135
training loss: 1.4204528331756592


training: 100%|█████████▉| 4975/5000 [2:48:53<00:49,  1.97s/it]

training loss: 1.3583123683929443
training loss: 1.5327026844024658
training loss: 1.526232361793518
training loss: 1.3193457126617432
training loss: 1.374910831451416
training loss: 1.4143314361572266


training: 100%|█████████▉| 4981/5000 [2:49:05<00:37,  1.97s/it]

training loss: 1.5233111381530762
training loss: 1.4323784112930298
training loss: 1.4868992567062378
training loss: 1.4813175201416016
training loss: 1.5114970207214355
training loss: 1.446900725364685


training: 100%|█████████▉| 4987/5000 [2:49:17<00:25,  1.97s/it]

training loss: 1.4778952598571777
training loss: 1.3465077877044678
training loss: 1.5284156799316406
training loss: 1.4682235717773438
training loss: 1.5115519762039185
training loss: 1.456234097480774


training: 100%|█████████▉| 4993/5000 [2:49:28<00:13,  1.97s/it]

training loss: 1.5038683414459229
training loss: 1.4685760736465454
training loss: 1.5336040258407593
training loss: 1.5108330249786377
training loss: 1.3156311511993408
training loss: 1.3943052291870117


training: 100%|█████████▉| 4999/5000 [2:49:40<00:01,  1.97s/it]

training loss: 1.452698826789856


training: 100%|██████████| 5000/5000 [2:49:42<00:00,  2.04s/it]

training loss: 1.467824101448059





In [4]:
loss = model(next(val_loader), return_loss = True)
print(f'validation loss: {loss.item()}')

validation loss: 1.372866153717041


